riscv_machine_timer: fix maximum allowed cycles between reports

There are two issues being fixed here:

1) The code currently clamps the timeout length so as not to overflow
   the computed cycle difference variable or the range of the
   sys_clock_announce() argument. But this completely fails to take
   into account the case where enough time elapses between two
   successive timeouts to overflow the cycle difference and/or the
   tick count anyway (see the worked numbers after this list).

2) If a timeout of K_TICKS_FOREVER is provided then the comparator is
   set to UINT64_MAX, which is bogus. Not only does this value make
   little sense in the context of a free-running cycle counter, but it
   also opens the possibility of the same cycle diff and/or tick
   overflow as above.
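
To put numbers on (1): assuming a 32-bit cycle_diff_t and a 10 MHz
timebase (hypothetical figures, neither of which is mandated by the
driver), the cycle difference saturates after

    0xffffffff cycles / 10000000 Hz  ~=  429 s

so two reports spaced further apart than that overflow the native
width division even though each individual timeout request was
within the clamped range.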

Fix both of those by clamping the actual number of cycles to wait for,
measured from the previous report occurrence, rather than clamping the
timeout ticks.
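
For reference, a simplified sketch of the report path that these
limits protect (reconstructed for illustration, not part of this
patch; mtime() stands for the free-running counter read): the elapsed
cycle delta is divided in native register width, so it must fit in a
cycle_diff_t, and the resulting tick count is handed to
sys_clock_announce() whose argument is an int32_t:

    uint64_t now = mtime();
    uint64_t dcycles = now - last_count; /* must fit in cycle_diff_t */
    uint32_t dticks = (cycle_diff_t)dcycles / CYC_PER_TICK;

    last_count += (cycle_diff_t)dticks * CYC_PER_TICK;
    sys_clock_announce(dticks);          /* at most INT32_MAX ticks */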

Signed-off-by: Nicolas Pitre <npitre@baylibre.com>
diff --git a/drivers/timer/riscv_machine_timer.c b/drivers/timer/riscv_machine_timer.c
index abfb28a..36e29c6 100644
--- a/drivers/timer/riscv_machine_timer.c
+++ b/drivers/timer/riscv_machine_timer.c
@@ -78,6 +78,32 @@
 
 /* the unsigned long cast limits divisions to native CPU register width */
 #define cycle_diff_t unsigned long
+#define CYCLE_DIFF_MAX (~(cycle_diff_t)0)
+
+/*
+ * We have two constraints on the maximum number of cycles we can wait for.
+ *
+ * 1) sys_clock_announce() accepts at most INT32_MAX ticks.
+ *
+ * 2) The number of cycles between two reports must fit in a cycle_diff_t
+ *    variable before converting it to ticks.
+ *
+ * Then:
+ *
+ * 3) Pick the smaller of (1) and (2).
+ *
+ * 4) Leave some room for the unavoidable IRQ servicing latency.
+ *    Let's use 3/4 of the max range.
+ *
+ * Finally let's add the LSB value to the result so as to clear out a
+ * bunch of consecutive set bits coming from the original max values and
+ * produce a nicer literal for assembly generation.
+ */
+#define CYCLES_MAX_1	((uint64_t)INT32_MAX * (uint64_t)CYC_PER_TICK)
+#define CYCLES_MAX_2	((uint64_t)CYCLE_DIFF_MAX)
+#define CYCLES_MAX_3	MIN(CYCLES_MAX_1, CYCLES_MAX_2)
+#define CYCLES_MAX_4	(CYCLES_MAX_3 / 2 + CYCLES_MAX_3 / 4)
+#define CYCLES_MAX	(CYCLES_MAX_4 + LSB_GET(CYCLES_MAX_4))
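+
+/*
+ * Purely illustrative evaluation of the above, assuming a 32-bit
+ * cycle_diff_t and CYC_PER_TICK == 1000 (neither of which is
+ * guaranteed here):
+ *
+ *	CYCLES_MAX_1 = 0x7fffffff * 1000  (about 2.1e12)
+ *	CYCLES_MAX_2 = 0xffffffff
+ *	CYCLES_MAX_3 = 0xffffffff  (the smaller of the two)
+ *	CYCLES_MAX_4 = 0x7fffffff + 0x3fffffff = 0xbffffffe
+ *	CYCLES_MAX   = 0xbffffffe + LSB_GET(0xbffffffe)
+ *	             = 0xbffffffe + 2 = 0xc0000000
+ */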
 
 static struct k_spinlock lock;
 static uint64_t last_count;
@@ -170,27 +196,19 @@
 		return;
 	}
 
-	if (ticks == K_TICKS_FOREVER) {
-		set_mtimecmp(UINT64_MAX);
-		return;
-	}
-
-	/*
-	 * Clamp the max period length to a number of cycles that can fit
-	 * in half the range of a cycle_diff_t for native width divisions
-	 * to be usable elsewhere. Also clamp it to half the range of an
-	 * int32_t as this is the type used for elapsed tick announcements.
-	 * The half range gives us extra room to cope with the unavoidable IRQ
-	 * servicing latency. The compiler should optimize away the least
-	 * restrictive of those tests automatically.
-	 */
-	ticks = CLAMP(ticks, 0, (cycle_diff_t)-1 / 2 / CYC_PER_TICK);
-	ticks = CLAMP(ticks, 0, INT32_MAX / 2);
-
 	k_spinlock_key_t key = k_spin_lock(&lock);
-	uint64_t cyc = (last_ticks + last_elapsed + ticks) * CYC_PER_TICK;
+	uint64_t cyc;
 
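+	/*
+	 * For K_TICKS_FOREVER, program the farthest comparator value we
+	 * can safely report instead of a bogus UINT64_MAX. Otherwise,
+	 * clamp the requested deadline so that the distance from the
+	 * previous report never exceeds CYCLES_MAX.
+	 */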
+	if (ticks == K_TICKS_FOREVER) {
+		cyc = last_count + CYCLES_MAX;
+	} else {
+		cyc = (last_ticks + last_elapsed + ticks) * CYC_PER_TICK;
+		if ((cyc - last_count) > CYCLES_MAX) {
+			cyc = last_count + CYCLES_MAX;
+		}
+	}
 	set_mtimecmp(cyc);
+
 	k_spin_unlock(&lock, key);
 }