1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright (c) 2012 Mellanox Technologies. All rights reserved.
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * This software is available to you under a choice of one of two
5*4882a593Smuzhiyun * licenses. You may choose to be licensed under the terms of the GNU
6*4882a593Smuzhiyun * General Public License (GPL) Version 2, available from the file
7*4882a593Smuzhiyun * COPYING in the main directory of this source tree, or the
8*4882a593Smuzhiyun * OpenIB.org BSD license below:
9*4882a593Smuzhiyun *
10*4882a593Smuzhiyun * Redistribution and use in source and binary forms, with or
11*4882a593Smuzhiyun * without modification, are permitted provided that the following
12*4882a593Smuzhiyun * conditions are met:
13*4882a593Smuzhiyun *
14*4882a593Smuzhiyun * - Redistributions of source code must retain the above
15*4882a593Smuzhiyun * copyright notice, this list of conditions and the following
16*4882a593Smuzhiyun * disclaimer.
17*4882a593Smuzhiyun *
18*4882a593Smuzhiyun * - Redistributions in binary form must reproduce the above
19*4882a593Smuzhiyun * copyright notice, this list of conditions and the following
20*4882a593Smuzhiyun * disclaimer in the documentation and/or other materials
21*4882a593Smuzhiyun * provided with the distribution.
22*4882a593Smuzhiyun *
23*4882a593Smuzhiyun * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24*4882a593Smuzhiyun * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25*4882a593Smuzhiyun * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26*4882a593Smuzhiyun * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27*4882a593Smuzhiyun * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28*4882a593Smuzhiyun * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29*4882a593Smuzhiyun * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30*4882a593Smuzhiyun * SOFTWARE.
31*4882a593Smuzhiyun *
32*4882a593Smuzhiyun */
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun #include <linux/mlx4/device.h>
35*4882a593Smuzhiyun #include <linux/clocksource.h>
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun #include "mlx4_en.h"
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun /* mlx4_en_read_clock - read raw cycle counter (to be used by time counter)
40*4882a593Smuzhiyun */
mlx4_en_read_clock(const struct cyclecounter * tc)41*4882a593Smuzhiyun static u64 mlx4_en_read_clock(const struct cyclecounter *tc)
42*4882a593Smuzhiyun {
43*4882a593Smuzhiyun struct mlx4_en_dev *mdev =
44*4882a593Smuzhiyun container_of(tc, struct mlx4_en_dev, cycles);
45*4882a593Smuzhiyun struct mlx4_dev *dev = mdev->dev;
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun return mlx4_read_clock(dev) & tc->mask;
48*4882a593Smuzhiyun }
49*4882a593Smuzhiyun
mlx4_en_get_cqe_ts(struct mlx4_cqe * cqe)50*4882a593Smuzhiyun u64 mlx4_en_get_cqe_ts(struct mlx4_cqe *cqe)
51*4882a593Smuzhiyun {
52*4882a593Smuzhiyun u64 hi, lo;
53*4882a593Smuzhiyun struct mlx4_ts_cqe *ts_cqe = (struct mlx4_ts_cqe *)cqe;
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun lo = (u64)be16_to_cpu(ts_cqe->timestamp_lo);
56*4882a593Smuzhiyun hi = ((u64)be32_to_cpu(ts_cqe->timestamp_hi) + !lo) << 16;
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun return hi | lo;
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun
mlx4_en_fill_hwtstamps(struct mlx4_en_dev * mdev,struct skb_shared_hwtstamps * hwts,u64 timestamp)61*4882a593Smuzhiyun void mlx4_en_fill_hwtstamps(struct mlx4_en_dev *mdev,
62*4882a593Smuzhiyun struct skb_shared_hwtstamps *hwts,
63*4882a593Smuzhiyun u64 timestamp)
64*4882a593Smuzhiyun {
65*4882a593Smuzhiyun unsigned int seq;
66*4882a593Smuzhiyun u64 nsec;
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun do {
69*4882a593Smuzhiyun seq = read_seqbegin(&mdev->clock_lock);
70*4882a593Smuzhiyun nsec = timecounter_cyc2time(&mdev->clock, timestamp);
71*4882a593Smuzhiyun } while (read_seqretry(&mdev->clock_lock, seq));
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun memset(hwts, 0, sizeof(struct skb_shared_hwtstamps));
74*4882a593Smuzhiyun hwts->hwtstamp = ns_to_ktime(nsec);
75*4882a593Smuzhiyun }
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun /**
78*4882a593Smuzhiyun * mlx4_en_remove_timestamp - disable PTP device
79*4882a593Smuzhiyun * @mdev: board private structure
80*4882a593Smuzhiyun *
81*4882a593Smuzhiyun * Stop the PTP support.
82*4882a593Smuzhiyun **/
mlx4_en_remove_timestamp(struct mlx4_en_dev * mdev)83*4882a593Smuzhiyun void mlx4_en_remove_timestamp(struct mlx4_en_dev *mdev)
84*4882a593Smuzhiyun {
85*4882a593Smuzhiyun if (mdev->ptp_clock) {
86*4882a593Smuzhiyun ptp_clock_unregister(mdev->ptp_clock);
87*4882a593Smuzhiyun mdev->ptp_clock = NULL;
88*4882a593Smuzhiyun mlx4_info(mdev, "removed PHC\n");
89*4882a593Smuzhiyun }
90*4882a593Smuzhiyun }
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun #define MLX4_EN_WRAP_AROUND_SEC 10UL
93*4882a593Smuzhiyun /* By scheduling the overflow check every 5 seconds, we have a reasonably
94*4882a593Smuzhiyun * good chance we wont miss a wrap around.
95*4882a593Smuzhiyun * TOTO: Use a timer instead of a work queue to increase the guarantee.
96*4882a593Smuzhiyun */
97*4882a593Smuzhiyun #define MLX4_EN_OVERFLOW_PERIOD (MLX4_EN_WRAP_AROUND_SEC * HZ / 2)
98*4882a593Smuzhiyun
mlx4_en_ptp_overflow_check(struct mlx4_en_dev * mdev)99*4882a593Smuzhiyun void mlx4_en_ptp_overflow_check(struct mlx4_en_dev *mdev)
100*4882a593Smuzhiyun {
101*4882a593Smuzhiyun bool timeout = time_is_before_jiffies(mdev->last_overflow_check +
102*4882a593Smuzhiyun MLX4_EN_OVERFLOW_PERIOD);
103*4882a593Smuzhiyun unsigned long flags;
104*4882a593Smuzhiyun
105*4882a593Smuzhiyun if (timeout) {
106*4882a593Smuzhiyun write_seqlock_irqsave(&mdev->clock_lock, flags);
107*4882a593Smuzhiyun timecounter_read(&mdev->clock);
108*4882a593Smuzhiyun write_sequnlock_irqrestore(&mdev->clock_lock, flags);
109*4882a593Smuzhiyun mdev->last_overflow_check = jiffies;
110*4882a593Smuzhiyun }
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun /**
114*4882a593Smuzhiyun * mlx4_en_phc_adjfreq - adjust the frequency of the hardware clock
115*4882a593Smuzhiyun * @ptp: ptp clock structure
116*4882a593Smuzhiyun * @delta: Desired frequency change in parts per billion
117*4882a593Smuzhiyun *
118*4882a593Smuzhiyun * Adjust the frequency of the PHC cycle counter by the indicated delta from
119*4882a593Smuzhiyun * the base frequency.
120*4882a593Smuzhiyun **/
mlx4_en_phc_adjfreq(struct ptp_clock_info * ptp,s32 delta)121*4882a593Smuzhiyun static int mlx4_en_phc_adjfreq(struct ptp_clock_info *ptp, s32 delta)
122*4882a593Smuzhiyun {
123*4882a593Smuzhiyun u64 adj;
124*4882a593Smuzhiyun u32 diff, mult;
125*4882a593Smuzhiyun int neg_adj = 0;
126*4882a593Smuzhiyun unsigned long flags;
127*4882a593Smuzhiyun struct mlx4_en_dev *mdev = container_of(ptp, struct mlx4_en_dev,
128*4882a593Smuzhiyun ptp_clock_info);
129*4882a593Smuzhiyun
130*4882a593Smuzhiyun if (delta < 0) {
131*4882a593Smuzhiyun neg_adj = 1;
132*4882a593Smuzhiyun delta = -delta;
133*4882a593Smuzhiyun }
134*4882a593Smuzhiyun mult = mdev->nominal_c_mult;
135*4882a593Smuzhiyun adj = mult;
136*4882a593Smuzhiyun adj *= delta;
137*4882a593Smuzhiyun diff = div_u64(adj, 1000000000ULL);
138*4882a593Smuzhiyun
139*4882a593Smuzhiyun write_seqlock_irqsave(&mdev->clock_lock, flags);
140*4882a593Smuzhiyun timecounter_read(&mdev->clock);
141*4882a593Smuzhiyun mdev->cycles.mult = neg_adj ? mult - diff : mult + diff;
142*4882a593Smuzhiyun write_sequnlock_irqrestore(&mdev->clock_lock, flags);
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun return 0;
145*4882a593Smuzhiyun }
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun /**
148*4882a593Smuzhiyun * mlx4_en_phc_adjtime - Shift the time of the hardware clock
149*4882a593Smuzhiyun * @ptp: ptp clock structure
150*4882a593Smuzhiyun * @delta: Desired change in nanoseconds
151*4882a593Smuzhiyun *
152*4882a593Smuzhiyun * Adjust the timer by resetting the timecounter structure.
153*4882a593Smuzhiyun **/
mlx4_en_phc_adjtime(struct ptp_clock_info * ptp,s64 delta)154*4882a593Smuzhiyun static int mlx4_en_phc_adjtime(struct ptp_clock_info *ptp, s64 delta)
155*4882a593Smuzhiyun {
156*4882a593Smuzhiyun struct mlx4_en_dev *mdev = container_of(ptp, struct mlx4_en_dev,
157*4882a593Smuzhiyun ptp_clock_info);
158*4882a593Smuzhiyun unsigned long flags;
159*4882a593Smuzhiyun
160*4882a593Smuzhiyun write_seqlock_irqsave(&mdev->clock_lock, flags);
161*4882a593Smuzhiyun timecounter_adjtime(&mdev->clock, delta);
162*4882a593Smuzhiyun write_sequnlock_irqrestore(&mdev->clock_lock, flags);
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun return 0;
165*4882a593Smuzhiyun }
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun /**
168*4882a593Smuzhiyun * mlx4_en_phc_gettime - Reads the current time from the hardware clock
169*4882a593Smuzhiyun * @ptp: ptp clock structure
170*4882a593Smuzhiyun * @ts: timespec structure to hold the current time value
171*4882a593Smuzhiyun *
172*4882a593Smuzhiyun * Read the timecounter and return the correct value in ns after converting
173*4882a593Smuzhiyun * it into a struct timespec.
174*4882a593Smuzhiyun **/
mlx4_en_phc_gettime(struct ptp_clock_info * ptp,struct timespec64 * ts)175*4882a593Smuzhiyun static int mlx4_en_phc_gettime(struct ptp_clock_info *ptp,
176*4882a593Smuzhiyun struct timespec64 *ts)
177*4882a593Smuzhiyun {
178*4882a593Smuzhiyun struct mlx4_en_dev *mdev = container_of(ptp, struct mlx4_en_dev,
179*4882a593Smuzhiyun ptp_clock_info);
180*4882a593Smuzhiyun unsigned long flags;
181*4882a593Smuzhiyun u64 ns;
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun write_seqlock_irqsave(&mdev->clock_lock, flags);
184*4882a593Smuzhiyun ns = timecounter_read(&mdev->clock);
185*4882a593Smuzhiyun write_sequnlock_irqrestore(&mdev->clock_lock, flags);
186*4882a593Smuzhiyun
187*4882a593Smuzhiyun *ts = ns_to_timespec64(ns);
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun return 0;
190*4882a593Smuzhiyun }
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun /**
193*4882a593Smuzhiyun * mlx4_en_phc_settime - Set the current time on the hardware clock
194*4882a593Smuzhiyun * @ptp: ptp clock structure
195*4882a593Smuzhiyun * @ts: timespec containing the new time for the cycle counter
196*4882a593Smuzhiyun *
197*4882a593Smuzhiyun * Reset the timecounter to use a new base value instead of the kernel
198*4882a593Smuzhiyun * wall timer value.
199*4882a593Smuzhiyun **/
mlx4_en_phc_settime(struct ptp_clock_info * ptp,const struct timespec64 * ts)200*4882a593Smuzhiyun static int mlx4_en_phc_settime(struct ptp_clock_info *ptp,
201*4882a593Smuzhiyun const struct timespec64 *ts)
202*4882a593Smuzhiyun {
203*4882a593Smuzhiyun struct mlx4_en_dev *mdev = container_of(ptp, struct mlx4_en_dev,
204*4882a593Smuzhiyun ptp_clock_info);
205*4882a593Smuzhiyun u64 ns = timespec64_to_ns(ts);
206*4882a593Smuzhiyun unsigned long flags;
207*4882a593Smuzhiyun
208*4882a593Smuzhiyun /* reset the timecounter */
209*4882a593Smuzhiyun write_seqlock_irqsave(&mdev->clock_lock, flags);
210*4882a593Smuzhiyun timecounter_init(&mdev->clock, &mdev->cycles, ns);
211*4882a593Smuzhiyun write_sequnlock_irqrestore(&mdev->clock_lock, flags);
212*4882a593Smuzhiyun
213*4882a593Smuzhiyun return 0;
214*4882a593Smuzhiyun }
215*4882a593Smuzhiyun
216*4882a593Smuzhiyun /**
217*4882a593Smuzhiyun * mlx4_en_phc_enable - enable or disable an ancillary feature
218*4882a593Smuzhiyun * @ptp: ptp clock structure
219*4882a593Smuzhiyun * @request: Desired resource to enable or disable
220*4882a593Smuzhiyun * @on: Caller passes one to enable or zero to disable
221*4882a593Smuzhiyun *
222*4882a593Smuzhiyun * Enable (or disable) ancillary features of the PHC subsystem.
223*4882a593Smuzhiyun * Currently, no ancillary features are supported.
224*4882a593Smuzhiyun **/
mlx4_en_phc_enable(struct ptp_clock_info __always_unused * ptp,struct ptp_clock_request __always_unused * request,int __always_unused on)225*4882a593Smuzhiyun static int mlx4_en_phc_enable(struct ptp_clock_info __always_unused *ptp,
226*4882a593Smuzhiyun struct ptp_clock_request __always_unused *request,
227*4882a593Smuzhiyun int __always_unused on)
228*4882a593Smuzhiyun {
229*4882a593Smuzhiyun return -EOPNOTSUPP;
230*4882a593Smuzhiyun }
231*4882a593Smuzhiyun
232*4882a593Smuzhiyun static const struct ptp_clock_info mlx4_en_ptp_clock_info = {
233*4882a593Smuzhiyun .owner = THIS_MODULE,
234*4882a593Smuzhiyun .max_adj = 100000000,
235*4882a593Smuzhiyun .n_alarm = 0,
236*4882a593Smuzhiyun .n_ext_ts = 0,
237*4882a593Smuzhiyun .n_per_out = 0,
238*4882a593Smuzhiyun .n_pins = 0,
239*4882a593Smuzhiyun .pps = 0,
240*4882a593Smuzhiyun .adjfreq = mlx4_en_phc_adjfreq,
241*4882a593Smuzhiyun .adjtime = mlx4_en_phc_adjtime,
242*4882a593Smuzhiyun .gettime64 = mlx4_en_phc_gettime,
243*4882a593Smuzhiyun .settime64 = mlx4_en_phc_settime,
244*4882a593Smuzhiyun .enable = mlx4_en_phc_enable,
245*4882a593Smuzhiyun };
246*4882a593Smuzhiyun
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun /* This function calculates the max shift that enables the user range
249*4882a593Smuzhiyun * of MLX4_EN_WRAP_AROUND_SEC values in the cycles register.
250*4882a593Smuzhiyun */
freq_to_shift(u16 freq)251*4882a593Smuzhiyun static u32 freq_to_shift(u16 freq)
252*4882a593Smuzhiyun {
253*4882a593Smuzhiyun u32 freq_khz = freq * 1000;
254*4882a593Smuzhiyun u64 max_val_cycles = freq_khz * 1000 * MLX4_EN_WRAP_AROUND_SEC;
255*4882a593Smuzhiyun u64 max_val_cycles_rounded = 1ULL << fls64(max_val_cycles - 1);
256*4882a593Smuzhiyun /* calculate max possible multiplier in order to fit in 64bit */
257*4882a593Smuzhiyun u64 max_mul = div64_u64(ULLONG_MAX, max_val_cycles_rounded);
258*4882a593Smuzhiyun
259*4882a593Smuzhiyun /* This comes from the reverse of clocksource_khz2mult */
260*4882a593Smuzhiyun return ilog2(div_u64(max_mul * freq_khz, 1000000));
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun
mlx4_en_init_timestamp(struct mlx4_en_dev * mdev)263*4882a593Smuzhiyun void mlx4_en_init_timestamp(struct mlx4_en_dev *mdev)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun struct mlx4_dev *dev = mdev->dev;
266*4882a593Smuzhiyun unsigned long flags;
267*4882a593Smuzhiyun
268*4882a593Smuzhiyun /* mlx4_en_init_timestamp is called for each netdev.
269*4882a593Smuzhiyun * mdev->ptp_clock is common for all ports, skip initialization if
270*4882a593Smuzhiyun * was done for other port.
271*4882a593Smuzhiyun */
272*4882a593Smuzhiyun if (mdev->ptp_clock)
273*4882a593Smuzhiyun return;
274*4882a593Smuzhiyun
275*4882a593Smuzhiyun seqlock_init(&mdev->clock_lock);
276*4882a593Smuzhiyun
277*4882a593Smuzhiyun memset(&mdev->cycles, 0, sizeof(mdev->cycles));
278*4882a593Smuzhiyun mdev->cycles.read = mlx4_en_read_clock;
279*4882a593Smuzhiyun mdev->cycles.mask = CLOCKSOURCE_MASK(48);
280*4882a593Smuzhiyun mdev->cycles.shift = freq_to_shift(dev->caps.hca_core_clock);
281*4882a593Smuzhiyun mdev->cycles.mult =
282*4882a593Smuzhiyun clocksource_khz2mult(1000 * dev->caps.hca_core_clock, mdev->cycles.shift);
283*4882a593Smuzhiyun mdev->nominal_c_mult = mdev->cycles.mult;
284*4882a593Smuzhiyun
285*4882a593Smuzhiyun write_seqlock_irqsave(&mdev->clock_lock, flags);
286*4882a593Smuzhiyun timecounter_init(&mdev->clock, &mdev->cycles,
287*4882a593Smuzhiyun ktime_to_ns(ktime_get_real()));
288*4882a593Smuzhiyun write_sequnlock_irqrestore(&mdev->clock_lock, flags);
289*4882a593Smuzhiyun
290*4882a593Smuzhiyun /* Configure the PHC */
291*4882a593Smuzhiyun mdev->ptp_clock_info = mlx4_en_ptp_clock_info;
292*4882a593Smuzhiyun snprintf(mdev->ptp_clock_info.name, 16, "mlx4 ptp");
293*4882a593Smuzhiyun
294*4882a593Smuzhiyun mdev->ptp_clock = ptp_clock_register(&mdev->ptp_clock_info,
295*4882a593Smuzhiyun &mdev->pdev->dev);
296*4882a593Smuzhiyun if (IS_ERR(mdev->ptp_clock)) {
297*4882a593Smuzhiyun mdev->ptp_clock = NULL;
298*4882a593Smuzhiyun mlx4_err(mdev, "ptp_clock_register failed\n");
299*4882a593Smuzhiyun } else if (mdev->ptp_clock) {
300*4882a593Smuzhiyun mlx4_info(mdev, "registered PHC clock\n");
301*4882a593Smuzhiyun }
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun }
304