]> Git Repo - linux.git/blobdiff - drivers/pwm/pwm-stm32.c
mfd: cros-ec: Increase maximum mkbp event size
[linux.git] / drivers / pwm / pwm-stm32.c
index 2708212933f72f077d2f23ef6b283a35c7bd0413..4f842550fbd127ce1b0f53522dfb7f4e60b74329 100644 (file)
@@ -8,6 +8,7 @@
  *             pwm-atmel.c from Bo Shen
  */
 
+#include <linux/bitfield.h>
 #include <linux/mfd/stm32-timers.h>
 #include <linux/module.h>
 #include <linux/of.h>
@@ -25,6 +26,7 @@ struct stm32_pwm {
        struct regmap *regmap;
        u32 max_arr;
        bool have_complementary_output;
+       u32 capture[4] ____cacheline_aligned; /* DMA'able buffer */
 };
 
 struct stm32_breakinput {
@@ -62,6 +64,258 @@ static int write_ccrx(struct stm32_pwm *dev, int ch, u32 value)
        return -EINVAL;
 }
 
+#define TIM_CCER_CC12P (TIM_CCER_CC1P | TIM_CCER_CC2P)
+#define TIM_CCER_CC12E (TIM_CCER_CC1E | TIM_CCER_CC2E)
+#define TIM_CCER_CC34P (TIM_CCER_CC3P | TIM_CCER_CC4P)
+#define TIM_CCER_CC34E (TIM_CCER_CC3E | TIM_CCER_CC4E)
+
+/*
+ * Capture using PWM input mode:
+ *                              ___          ___
+ * TI[1, 2, 3 or 4]: ........._|   |________|
+ *                             ^0  ^1       ^2
+ *                              .   .        .
+ *                              .   .        XXXXX
+ *                              .   .   XXXXX     |
+ *                              .  XXXXX     .    |
+ *                            XXXXX .        .    |
+ * COUNTER:        ______XXXXX  .   .        .    |_XXX
+ *                 start^       .   .        .        ^stop
+ *                      .       .   .        .
+ *                      v       v   .        v
+ *                                  v
+ * CCR1/CCR3:       tx..........t0...........t2
+ * CCR2/CCR4:       tx..............t1.........
+ *
+ * DMA burst transfer:          |            |
+ *                              v            v
+ * DMA buffer:                  { t0, tx }   { t2, t1 }
+ * DMA done:                                 ^
+ *
+ * 0: IC1/3 snapchot on rising edge: counter value -> CCR1/CCR3
+ *    + DMA transfer CCR[1/3] & CCR[2/4] values (t0, tx: doesn't care)
+ * 1: IC2/4 snapchot on falling edge: counter value -> CCR2/CCR4
+ * 2: IC1/3 snapchot on rising edge: counter value -> CCR1/CCR3
+ *    + DMA transfer CCR[1/3] & CCR[2/4] values (t2, t1)
+ *
+ * DMA done, compute:
+ * - Period     = t2 - t0
+ * - Duty cycle = t1 - t0
+ */
+static int stm32_pwm_raw_capture(struct stm32_pwm *priv, struct pwm_device *pwm,
+                                unsigned long tmo_ms, u32 *raw_prd,
+                                u32 *raw_dty)
+{
+       struct device *parent = priv->chip.dev->parent;
+       enum stm32_timers_dmas dma_id;
+       u32 ccen, ccr;
+       int ret;
+
+       /* Ensure registers have been updated, enable counter and capture */
+       regmap_update_bits(priv->regmap, TIM_EGR, TIM_EGR_UG, TIM_EGR_UG);
+       regmap_update_bits(priv->regmap, TIM_CR1, TIM_CR1_CEN, TIM_CR1_CEN);
+
+       /* Use cc1 or cc3 DMA resp for PWM input channels 1 & 2 or 3 & 4 */
+       dma_id = pwm->hwpwm < 2 ? STM32_TIMERS_DMA_CH1 : STM32_TIMERS_DMA_CH3;
+       ccen = pwm->hwpwm < 2 ? TIM_CCER_CC12E : TIM_CCER_CC34E;
+       ccr = pwm->hwpwm < 2 ? TIM_CCR1 : TIM_CCR3;
+       regmap_update_bits(priv->regmap, TIM_CCER, ccen, ccen);
+
+       /*
+        * Timer DMA burst mode. Request 2 registers, 2 bursts, to get both
+        * CCR1 & CCR2 (or CCR3 & CCR4) on each capture event.
+        * We'll get two capture snapchots: { CCR1, CCR2 }, { CCR1, CCR2 }
+        * or { CCR3, CCR4 }, { CCR3, CCR4 }
+        */
+       ret = stm32_timers_dma_burst_read(parent, priv->capture, dma_id, ccr, 2,
+                                         2, tmo_ms);
+       if (ret)
+               goto stop;
+
+       /* Period: t2 - t0 (take care of counter overflow) */
+       if (priv->capture[0] <= priv->capture[2])
+               *raw_prd = priv->capture[2] - priv->capture[0];
+       else
+               *raw_prd = priv->max_arr - priv->capture[0] + priv->capture[2];
+
+       /* Duty cycle capture requires at least two capture units */
+       if (pwm->chip->npwm < 2)
+               *raw_dty = 0;
+       else if (priv->capture[0] <= priv->capture[3])
+               *raw_dty = priv->capture[3] - priv->capture[0];
+       else
+               *raw_dty = priv->max_arr - priv->capture[0] + priv->capture[3];
+
+       if (*raw_dty > *raw_prd) {
+               /*
+                * Race beetween PWM input and DMA: it may happen
+                * falling edge triggers new capture on TI2/4 before DMA
+                * had a chance to read CCR2/4. It means capture[1]
+                * contains period + duty_cycle. So, subtract period.
+                */
+               *raw_dty -= *raw_prd;
+       }
+
+stop:
+       regmap_update_bits(priv->regmap, TIM_CCER, ccen, 0);
+       regmap_update_bits(priv->regmap, TIM_CR1, TIM_CR1_CEN, 0);
+
+       return ret;
+}
+
+static int stm32_pwm_capture(struct pwm_chip *chip, struct pwm_device *pwm,
+                            struct pwm_capture *result, unsigned long tmo_ms)
+{
+       struct stm32_pwm *priv = to_stm32_pwm_dev(chip);
+       unsigned long long prd, div, dty;
+       unsigned long rate;
+       unsigned int psc = 0, icpsc, scale;
+       u32 raw_prd = 0, raw_dty = 0;
+       int ret = 0;
+
+       mutex_lock(&priv->lock);
+
+       if (active_channels(priv)) {
+               ret = -EBUSY;
+               goto unlock;
+       }
+
+       ret = clk_enable(priv->clk);
+       if (ret) {
+               dev_err(priv->chip.dev, "failed to enable counter clock\n");
+               goto unlock;
+       }
+
+       rate = clk_get_rate(priv->clk);
+       if (!rate) {
+               ret = -EINVAL;
+               goto clk_dis;
+       }
+
+       /* prescaler: fit timeout window provided by upper layer */
+       div = (unsigned long long)rate * (unsigned long long)tmo_ms;
+       do_div(div, MSEC_PER_SEC);
+       prd = div;
+       while ((div > priv->max_arr) && (psc < MAX_TIM_PSC)) {
+               psc++;
+               div = prd;
+               do_div(div, psc + 1);
+       }
+       regmap_write(priv->regmap, TIM_ARR, priv->max_arr);
+       regmap_write(priv->regmap, TIM_PSC, psc);
+
+       /* Map TI1 or TI2 PWM input to IC1 & IC2 (or TI3/4 to IC3 & IC4) */
+       regmap_update_bits(priv->regmap,
+                          pwm->hwpwm < 2 ? TIM_CCMR1 : TIM_CCMR2,
+                          TIM_CCMR_CC1S | TIM_CCMR_CC2S, pwm->hwpwm & 0x1 ?
+                          TIM_CCMR_CC1S_TI2 | TIM_CCMR_CC2S_TI2 :
+                          TIM_CCMR_CC1S_TI1 | TIM_CCMR_CC2S_TI1);
+
+       /* Capture period on IC1/3 rising edge, duty cycle on IC2/4 falling. */
+       regmap_update_bits(priv->regmap, TIM_CCER, pwm->hwpwm < 2 ?
+                          TIM_CCER_CC12P : TIM_CCER_CC34P, pwm->hwpwm < 2 ?
+                          TIM_CCER_CC2P : TIM_CCER_CC4P);
+
+       ret = stm32_pwm_raw_capture(priv, pwm, tmo_ms, &raw_prd, &raw_dty);
+       if (ret)
+               goto stop;
+
+       /*
+        * Got a capture. Try to improve accuracy at high rates:
+        * - decrease counter clock prescaler, scale up to max rate.
+        * - use input prescaler, capture once every /2 /4 or /8 edges.
+        */
+       if (raw_prd) {
+               u32 max_arr = priv->max_arr - 0x1000; /* arbitrary margin */
+
+               scale = max_arr / min(max_arr, raw_prd);
+       } else {
+               scale = priv->max_arr; /* bellow resolution, use max scale */
+       }
+
+       if (psc && scale > 1) {
+               /* 2nd measure with new scale */
+               psc /= scale;
+               regmap_write(priv->regmap, TIM_PSC, psc);
+               ret = stm32_pwm_raw_capture(priv, pwm, tmo_ms, &raw_prd,
+                                           &raw_dty);
+               if (ret)
+                       goto stop;
+       }
+
+       /* Compute intermediate period not to exceed timeout at low rates */
+       prd = (unsigned long long)raw_prd * (psc + 1) * NSEC_PER_SEC;
+       do_div(prd, rate);
+
+       for (icpsc = 0; icpsc < MAX_TIM_ICPSC ; icpsc++) {
+               /* input prescaler: also keep arbitrary margin */
+               if (raw_prd >= (priv->max_arr - 0x1000) >> (icpsc + 1))
+                       break;
+               if (prd >= (tmo_ms * NSEC_PER_MSEC) >> (icpsc + 2))
+                       break;
+       }
+
+       if (!icpsc)
+               goto done;
+
+       /* Last chance to improve period accuracy, using input prescaler */
+       regmap_update_bits(priv->regmap,
+                          pwm->hwpwm < 2 ? TIM_CCMR1 : TIM_CCMR2,
+                          TIM_CCMR_IC1PSC | TIM_CCMR_IC2PSC,
+                          FIELD_PREP(TIM_CCMR_IC1PSC, icpsc) |
+                          FIELD_PREP(TIM_CCMR_IC2PSC, icpsc));
+
+       ret = stm32_pwm_raw_capture(priv, pwm, tmo_ms, &raw_prd, &raw_dty);
+       if (ret)
+               goto stop;
+
+       if (raw_dty >= (raw_prd >> icpsc)) {
+               /*
+                * We may fall here using input prescaler, when input
+                * capture starts on high side (before falling edge).
+                * Example with icpsc to capture on each 4 events:
+                *
+                *       start   1st capture                     2nd capture
+                *         v     v                               v
+                *         ___   _____   _____   _____   _____   ____
+                * TI1..4     |__|    |__|    |__|    |__|    |__|
+                *            v  v    .  .    .  .    .       v  v
+                * icpsc1/3:  .  0    .  1    .  2    .  3    .  0
+                * icpsc2/4:  0       1       2       3       0
+                *            v  v                            v  v
+                * CCR1/3  ......t0..............................t2
+                * CCR2/4  ..t1..............................t1'...
+                *               .                            .  .
+                * Capture0:     .<----------------------------->.
+                * Capture1:     .<-------------------------->.  .
+                *               .                            .  .
+                * Period:       .<------>                    .  .
+                * Low side:                                  .<>.
+                *
+                * Result:
+                * - Period = Capture0 / icpsc
+                * - Duty = Period - Low side = Period - (Capture0 - Capture1)
+                */
+               raw_dty = (raw_prd >> icpsc) - (raw_prd - raw_dty);
+       }
+
+done:
+       prd = (unsigned long long)raw_prd * (psc + 1) * NSEC_PER_SEC;
+       result->period = DIV_ROUND_UP_ULL(prd, rate << icpsc);
+       dty = (unsigned long long)raw_dty * (psc + 1) * NSEC_PER_SEC;
+       result->duty_cycle = DIV_ROUND_UP_ULL(dty, rate);
+stop:
+       regmap_write(priv->regmap, TIM_CCER, 0);
+       regmap_write(priv->regmap, pwm->hwpwm < 2 ? TIM_CCMR1 : TIM_CCMR2, 0);
+       regmap_write(priv->regmap, TIM_PSC, 0);
+clk_dis:
+       clk_disable(priv->clk);
+unlock:
+       mutex_unlock(&priv->lock);
+
+       return ret;
+}
+
 static int stm32_pwm_config(struct stm32_pwm *priv, int ch,
                            int duty_ns, int period_ns)
 {
@@ -230,6 +484,7 @@ static int stm32_pwm_apply_locked(struct pwm_chip *chip, struct pwm_device *pwm,
 static const struct pwm_ops stm32pwm_ops = {
        .owner = THIS_MODULE,
        .apply = stm32_pwm_apply_locked,
+       .capture = IS_ENABLED(CONFIG_DMA_ENGINE) ? stm32_pwm_capture : NULL,
 };
 
 static int stm32_pwm_set_breakinput(struct stm32_pwm *priv,
This page took 0.038925 seconds and 4 git commands to generate.