- 
                Notifications
    You must be signed in to change notification settings 
- Fork 6
dwt: copy DWT management and profiling features from stm32f4xx-hal (#50) #61
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
          
     Merged
      
        
      
    
  
     Merged
                    Changes from 1 commit
      Commits
    
    
            Show all changes
          
          
            2 commits
          
        
        Select commit
          Hold shift + click to select a range
      
      
    File filter
Filter by extension
Conversations
          Failed to load comments.   
        
        
          
      Loading
        
  Jump to
        
          Jump to file
        
      
      
          Failed to load files.   
        
        
          
      Loading
        
  Diff view
Diff view
There are no files selected for viewing
  
    
      This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
      Learn more about bidirectional Unicode characters
    
  
  
    
              | Original file line number | Diff line number | Diff line change | 
|---|---|---|
| @@ -0,0 +1,73 @@ | ||
| #![deny(unsafe_code)] | ||
| #![deny(warnings)] | ||
| #![no_main] | ||
| #![no_std] | ||
|  | ||
| mod utilities; | ||
|  | ||
| use cortex_m_rt::entry; | ||
| use embedded_hal::delay::DelayNs; | ||
| use log::info; | ||
| use stm32h5xx_hal::{ | ||
| dwt::{ClockDuration, DwtExt}, | ||
| pac, | ||
| prelude::*, | ||
| }; | ||
|  | ||
| #[entry] | ||
| fn main() -> ! { | ||
| utilities::logger::init(); | ||
|  | ||
| let cp = cortex_m::Peripherals::take().unwrap(); | ||
| let dp = pac::Peripherals::take().unwrap(); | ||
|  | ||
| info!("Setup PWR... "); | ||
| let pwr = dp.PWR.constrain(); | ||
| let pwrcfg = pwr.vos0().freeze(); | ||
|  | ||
| // Constrain and Freeze clock | ||
| info!("Setup RCC... "); | ||
| let rcc = dp.RCC.constrain(); | ||
| let ccdr = rcc.sys_ck(250.MHz()).freeze(pwrcfg, &dp.SBS); | ||
|  | ||
| let gpioa = dp.GPIOA.split(ccdr.peripheral.GPIOA); | ||
| let mut led = gpioa.pa5.into_push_pull_output(); | ||
|  | ||
| // Create a delay abstraction based on DWT cycle counter | ||
| let dwt = cp.DWT.constrain(cp.DCB, &ccdr.clocks); | ||
| let mut delay = dwt.delay(); | ||
|  | ||
| // Create a stopwatch for maximum 9 laps | ||
| // Note: it starts immediately | ||
| let mut lap_times = [0u32; 10]; | ||
| let mut sw = dwt.stopwatch(&mut lap_times); | ||
| loop { | ||
| // On for 1s, off for 1s. | ||
| led.set_high(); | ||
| delay.delay_ms(1000); | ||
| sw.lap(); | ||
| led.set_low(); | ||
| delay.delay_ms(900); | ||
|  | ||
| // Also you can measure with almost clock precision | ||
| let cd: ClockDuration = dwt.measure(|| delay.delay_ms(100)); | ||
| info!("Ticks: {}", cd.as_ticks()); // Should return 250MHz * 0.1s as u32 | ||
| info!("Secs (f32): {}", cd.as_secs_f32()); // Should return ~0.1s as a f32 | ||
| info!("Secs (f64): {}", cd.as_secs_f64()); // Should return ~0.1s as a f64 | ||
| info!("Nanos: {}", cd.as_nanos()); // Should return 100000000ns as a u64 | ||
|  | ||
| sw.lap(); | ||
|  | ||
| // Get all the lap times | ||
| { | ||
| let mut lap = 1; | ||
| while let Some(lap_time) = sw.lap_time(lap) { | ||
| let _t = lap_time.as_secs_f64(); | ||
| lap += 1; | ||
| } | ||
| } | ||
|  | ||
| // Reset stopwatch | ||
| sw.reset(); | ||
| } | ||
| } | 
  
    
      This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
      Learn more about bidirectional Unicode characters
    
  
  
    
              | Original file line number | Diff line number | Diff line change | 
|---|---|---|
| @@ -0,0 +1,267 @@ | ||
| //! Debug and trace management for profiling/tracing operations | ||
| //! This module provides an interface for using the DWT (Data Watchpoint and Trace) | ||
| //! unit on Cortex-M microcontrollers, allowing for cycle counting and tracing | ||
| //! of code execution. | ||
|  | ||
| use cortex_m::peripheral::{DCB, DWT}; | ||
| use fugit::HertzU32 as Hertz; | ||
|  | ||
| use crate::rcc::CoreClocks; | ||
|  | ||
| pub trait DwtExt { | ||
| fn constrain(self, dcb: DCB, clocks: &CoreClocks) -> Dwt; | ||
| } | ||
| impl DwtExt for DWT { | ||
| /// Enable trace unit and cycle counter | ||
| fn constrain(mut self, mut dcb: DCB, clocks: &CoreClocks) -> Dwt { | ||
| dcb.enable_trace(); | ||
| self.enable_cycle_counter(); | ||
| Dwt { | ||
| dwt: self, | ||
| dcb, | ||
| clock: clocks.hclk(), | ||
| } | ||
| } | ||
| } | ||
|  | ||
| /// DWT (Data Watchpoint and Trace) unit | ||
| pub struct Dwt { | ||
| dwt: DWT, | ||
| dcb: DCB, | ||
| clock: Hertz, | ||
| } | ||
| impl Dwt { | ||
| /// Release the dwt and dcb control | ||
| /// # Safety | ||
| /// All instances of Delay and StopWatch become invalid after this | ||
| pub unsafe fn release(self) -> (DWT, DCB) { | ||
| (self.dwt, self.dcb) | ||
| } | ||
| /// Create a delay instance | ||
| pub fn delay(&self) -> Delay { | ||
| Delay { clock: self.clock } | ||
| } | ||
| /// Create a stopwatch instance | ||
| /// # Arguments | ||
| /// * `times` - Array which will be holding the timings in ticks (max laps == times.len()-1) | ||
| pub fn stopwatch<'i>(&self, times: &'i mut [u32]) -> StopWatch<'i> { | ||
| StopWatch::new(times, self.clock) | ||
| } | ||
| /// Measure cycles it takes to execute closure `f`. | ||
| /// | ||
| /// Since DWT Cycle Counter is a 32-bit counter that wraps around to 0 on overflow, | ||
| /// users should be aware that `Dwt::measure` cannot correctly measure running time of | ||
| /// closures which take longer than `u32::MAX` cycles | ||
| pub fn measure<F: FnOnce()>(&self, f: F) -> ClockDuration { | ||
| let mut times: [u32; 2] = [0; 2]; | ||
| let mut sw = self.stopwatch(&mut times); | ||
| f(); | ||
| sw.lap().lap_time(1).unwrap() | ||
| } | ||
| } | ||
|  | ||
| #[derive(Clone, Copy)] | ||
| pub struct Delay { | ||
| clock: Hertz, | ||
| } | ||
| impl Delay { | ||
| /// Delay for `ClockDuration::ticks` | ||
| pub fn delay(duration: ClockDuration) { | ||
| let ticks = duration.ticks as u64; | ||
| Delay::delay_ticks(DWT::cycle_count(), ticks); | ||
| } | ||
| /// Delay ticks | ||
| /// NOTE DCB and DWT need to be set up for this to work, so it is private | ||
| fn delay_ticks(mut start: u32, ticks: u64) { | ||
| if ticks < (u32::MAX / 2) as u64 { | ||
| // Simple delay | ||
| let ticks = ticks as u32; | ||
| while (DWT::cycle_count().wrapping_sub(start)) < ticks {} | ||
| } else if ticks <= u32::MAX as u64 { | ||
| // Try to avoid race conditions by limiting delay to u32::MAX / 2 | ||
| let mut ticks = ticks as u32; | ||
| ticks -= u32::MAX / 2; | ||
| while (DWT::cycle_count().wrapping_sub(start)) < u32::MAX / 2 {} | ||
| start -= u32::MAX / 2; | ||
| while (DWT::cycle_count().wrapping_sub(start)) < ticks {} | ||
| } else { | ||
| // Delay for ticks, then delay for rest * u32::MAX | ||
| let mut rest = (ticks >> 32) as u32; | ||
| let ticks = (ticks & u32::MAX as u64) as u32; | ||
| loop { | ||
| while (DWT::cycle_count().wrapping_sub(start)) < ticks {} | ||
| if rest == 0 { | ||
| break; | ||
| } | ||
| rest -= 1; | ||
| while (DWT::cycle_count().wrapping_sub(start)) > ticks {} | ||
| } | ||
| } | ||
| } | ||
| } | ||
|  | ||
| impl embedded_hal::delay::DelayNs for Delay { | ||
| fn delay_ns(&mut self, ns: u32) { | ||
| // Convert us to ticks | ||
| let start = DWT::cycle_count(); | ||
| let ticks = (ns as u64 * self.clock.raw() as u64) / 1_000_000_000; | ||
| Delay::delay_ticks(start, ticks); | ||
| } | ||
|  | ||
| fn delay_us(&mut self, us: u32) { | ||
| // Convert us to ticks | ||
| let start = DWT::cycle_count(); | ||
| let ticks = (us as u64 * self.clock.raw() as u64) / 1_000_000; | ||
| Delay::delay_ticks(start, ticks); | ||
| } | ||
|  | ||
| fn delay_ms(&mut self, ms: u32) { | ||
| // Convert ms to ticks | ||
| let start = DWT::cycle_count(); | ||
| let ticks = (ms as u64 * self.clock.raw() as u64) / 1_000; | ||
| Delay::delay_ticks(start, ticks); | ||
| } | ||
| } | ||
|  | ||
| /// Very simple stopwatch which reads from DWT Cycle Counter to record timing. | ||
| /// | ||
| /// Since DWT Cycle Counter is a 32-bit counter that wraps around to 0 on overflow, | ||
| /// users should be aware that `StopWatch` cannot correctly measure laps | ||
| /// which take longer than `u32::MAX` cycles | ||
| pub struct StopWatch<'l> { | ||
| times: &'l mut [u32], | ||
| timei: usize, | ||
| clock: Hertz, | ||
| } | ||
| impl<'l> StopWatch<'l> { | ||
| /// Create a new instance (Private because dwt/dcb should be set up) | ||
| /// # Arguments | ||
| /// * `times` - Array which will be holding the timings (max laps == times.len()-1) | ||
| /// * `clock` - The DWT cycle counters clock | ||
| fn new(times: &'l mut [u32], clock: Hertz) -> Self { | ||
| assert!(times.len() >= 2); | ||
| let mut sw = StopWatch { | ||
| times, | ||
| timei: 0, | ||
| clock, | ||
| }; | ||
| sw.reset(); | ||
| sw | ||
| } | ||
| /// Returns the numbers of laps recorded | ||
| pub fn lap_count(&self) -> usize { | ||
| self.timei | ||
| } | ||
| /// Resets recorded laps to 0 and sets 0 offset | ||
| pub fn reset(&mut self) { | ||
| self.timei = 0; | ||
| self.times[0] = DWT::cycle_count(); | ||
| } | ||
| /// Record a new lap. | ||
| /// | ||
| /// If lap count exceeds maximum, the last lap is updated | ||
| pub fn lap(&mut self) -> &mut Self { | ||
| let c = DWT::cycle_count(); | ||
| if self.timei < self.times.len() { | ||
| self.timei += 1; | ||
| } | ||
| self.times[self.timei] = c; | ||
| self | ||
| } | ||
| /// Calculate the time of lap n (n starting with 1). | ||
| /// | ||
| /// Returns None if `n` is out of range | ||
| pub fn lap_time(&self, n: usize) -> Option<ClockDuration> { | ||
| if (n < 1) || (self.timei < n) { | ||
| None | ||
| } else { | ||
| Some(ClockDuration { | ||
| ticks: self.times[n].wrapping_sub(self.times[n - 1]), | ||
| clock: self.clock, | ||
| }) | ||
| } | ||
| } | ||
| } | ||
|  | ||
| /// Clock difference with capability to calculate SI units (s) | ||
| #[derive(Clone, Copy)] | ||
| pub struct ClockDuration { | ||
| ticks: u32, | ||
| clock: Hertz, | ||
| } | ||
| impl ClockDuration { | ||
| /// Returns ticks | ||
| pub fn as_ticks(self) -> u32 { | ||
| self.ticks | ||
| } | ||
| /// Returns calculated milliseconds as integer | ||
| pub fn as_millis(self) -> u64 { | ||
| self.ticks as u64 * 1_000 / self.clock.raw() as u64 | ||
| } | ||
| /// Returns calculated microseconds as integer | ||
| pub fn as_micros(self) -> u64 { | ||
| self.ticks as u64 * 1_000_000 / self.clock.raw() as u64 | ||
| } | ||
| /// Returns calculated nanoseconds as integer | ||
| pub fn as_nanos(self) -> u64 { | ||
| self.ticks as u64 * 1_000_000_000 / self.clock.raw() as u64 | ||
| } | ||
| /// Return calculated seconds as 32-bit float | ||
| pub fn as_secs_f32(self) -> f32 { | ||
| self.ticks as f32 / self.clock.raw() as f32 | ||
| } | ||
| /// Return calculated seconds as 64-bit float | ||
| pub fn as_secs_f64(self) -> f64 { | ||
| self.ticks as f64 / self.clock.raw() as f64 | ||
| } | ||
| } | ||
|  | ||
| /// A monotonic non-decreasing timer | ||
| /// | ||
| /// This uses the timer in the debug watch trace peripheral. This means, that if the | ||
| /// core is stopped, the timer does not count up. This may be relevant if you are using | ||
| /// cortex_m_semihosting::hprintln for debugging in which case the timer will be stopped | ||
| /// while printing | ||
| #[derive(Clone, Copy)] | ||
| pub struct MonoTimer { | ||
| frequency: Hertz, | ||
| } | ||
|  | ||
| impl MonoTimer { | ||
| /// Creates a new `Monotonic` timer | ||
| pub fn new(mut dwt: DWT, mut dcb: DCB, clocks: &CoreClocks) -> Self { | ||
| dcb.enable_trace(); | ||
| dwt.enable_cycle_counter(); | ||
|  | ||
| // now the CYCCNT counter can't be stopped or reset | ||
|  | ||
| MonoTimer { | ||
| frequency: clocks.hclk(), | ||
| } | ||
| } | ||
|  | ||
| /// Returns the frequency at which the monotonic timer is operating at | ||
| pub fn frequency(self) -> Hertz { | ||
| self.frequency | ||
| } | ||
|  | ||
| /// Returns an `Instant` corresponding to "now" | ||
| pub fn now(self) -> Instant { | ||
| Instant { | ||
| now: DWT::cycle_count(), | ||
| } | ||
| } | ||
| } | ||
|  | ||
| /// A measurement of a monotonically non-decreasing clock | ||
| #[derive(Clone, Copy)] | ||
| pub struct Instant { | ||
| now: u32, | ||
| } | ||
|  | ||
| impl Instant { | ||
| /// Ticks elapsed since the `Instant` was created | ||
| pub fn elapsed(self) -> u32 { | ||
| DWT::cycle_count().wrapping_sub(self.now) | ||
| } | ||
| } | ||
  
    
      This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
      Learn more about bidirectional Unicode characters
    
  
  
    
              
  
    
      This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
      Learn more about bidirectional Unicode characters
    
  
  
    
              
  Add this suggestion to a batch that can be applied as a single commit.
  This suggestion is invalid because no changes were made to the code.
  Suggestions cannot be applied while the pull request is closed.
  Suggestions cannot be applied while viewing a subset of changes.
  Only one suggestion per line can be applied in a batch.
  Add this suggestion to a batch that can be applied as a single commit.
  Applying suggestions on deleted lines is not supported.
  You must change the existing code in this line in order to create a valid suggestion.
  Outdated suggestions cannot be applied.
  This suggestion has been applied or marked resolved.
  Suggestions cannot be applied from pending reviews.
  Suggestions cannot be applied on multi-line comments.
  Suggestions cannot be applied while the pull request is queued to merge.
  Suggestion cannot be applied right now. Please check back later.
  
    
  
    
Uh oh!
There was an error while loading. Please reload this page.