fbdev: Garbage collect fbdev scrolling acceleration, part 1 (from TODO list)
[linux-2.6-microblaze.git] / sound / firewire / motu / amdtp-motu.c
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * amdtp-motu.c - a part of driver for MOTU FireWire series
4  *
5  * Copyright (c) 2015-2017 Takashi Sakamoto <o-takashi@sakamocchi.jp>
6  */
7
8 #include <linux/slab.h>
9 #include <sound/pcm.h>
10 #include "motu.h"
11
12 #define CREATE_TRACE_POINTS
13 #include "amdtp-motu-trace.h"
14
/* Values for the FMT field of CIP header, passed at stream initialization. */
#define CIP_FMT_MOTU            0x02
#define CIP_FMT_MOTU_TX_V3      0x22
/* Fixed value for the FDF field of packets in the outgoing stream. */
#define MOTU_FDF_AM824          0x22

/* Time base used to express the timestamp in source packet header (SPH). */
#define TICKS_PER_CYCLE         3072
#define CYCLES_PER_SECOND       8000
#define TICKS_PER_SECOND        (CYCLES_PER_SECOND * TICKS_PER_CYCLE)

/*
 * Layout of SPH: the cycle count occupies 13 bits above the 12 bit offset
 * within the cycle.
 */
#define CIP_SPH_CYCLE_SHIFT     12
#define CIP_SPH_CYCLE_MASK      (0x1fff << CIP_SPH_CYCLE_SHIFT)
#define CIP_SPH_OFFSET_MASK     ((1 << CIP_SPH_CYCLE_SHIFT) - 1)

/*
 * The nominal rate of MIDI is 3125 bytes/second. Be conservative since the
 * clock of the MIDI port might be 1% too slow and the bus clock 100 ppm too
 * fast.
 */
#define MIDI_BYTES_PER_SECOND   3093
32
/* Protocol-specific data attached to an AMDTP stream for MOTU devices. */
struct amdtp_motu {
        /* The number of PCM chunks in a data block; one chunk per channel. */
        unsigned int pcm_chunks;
        /* Offset in bytes from the head of a data block to the first PCM chunk. */
        unsigned int pcm_byte_offset;

        /* Substream registered by the MIDI trigger; read with READ_ONCE(). */
        struct snd_rawmidi_substream *midi;
        /* MIDI bytes in data blocks are handled only when this is non-zero. */
        unsigned int midi_ports;
        /* Offsets in bytes from the head of a data block. */
        unsigned int midi_flag_offset;
        unsigned int midi_byte_offset;

        /* Down counter of data blocks; a MIDI byte is sent only at zero. */
        int midi_db_count;
        /* Reload value of the counter: sampling rate / MIDI_BYTES_PER_SECOND. */
        unsigned int midi_db_interval;

        /* Cache of event offsets, given by the caller at initialization. */
        struct amdtp_motu_cache *cache;
};
47
48 int amdtp_motu_set_parameters(struct amdtp_stream *s, unsigned int rate,
49                               unsigned int midi_ports,
50                               struct snd_motu_packet_format *formats)
51 {
52         struct amdtp_motu *p = s->protocol;
53         unsigned int pcm_chunks, data_chunks, data_block_quadlets;
54         unsigned int mode;
55         int i, err;
56
57         if (amdtp_stream_running(s))
58                 return -EBUSY;
59
60         for (i = 0; i < ARRAY_SIZE(snd_motu_clock_rates); ++i) {
61                 if (snd_motu_clock_rates[i] == rate) {
62                         mode = i >> 1;
63                         break;
64                 }
65         }
66         if (i == ARRAY_SIZE(snd_motu_clock_rates))
67                 return -EINVAL;
68
69         // Each data block includes SPH in its head. Data chunks follow with
70         // 3 byte alignment. Padding follows with zero to conform to quadlet
71         // alignment.
72         pcm_chunks = formats->pcm_chunks[mode];
73         data_chunks = formats->msg_chunks + pcm_chunks;
74         data_block_quadlets = 1 + DIV_ROUND_UP(data_chunks * 3, 4);
75
76         err = amdtp_stream_set_parameters(s, rate, data_block_quadlets);
77         if (err < 0)
78                 return err;
79
80         p->pcm_chunks = pcm_chunks;
81         p->pcm_byte_offset = formats->pcm_byte_offset;
82
83         p->midi_ports = midi_ports;
84         p->midi_flag_offset = formats->midi_flag_offset;
85         p->midi_byte_offset = formats->midi_byte_offset;
86
87         p->midi_db_count = 0;
88         p->midi_db_interval = rate / MIDI_BYTES_PER_SECOND;
89
90         return 0;
91 }
92
93 static void read_pcm_s32(struct amdtp_stream *s, struct snd_pcm_substream *pcm,
94                          __be32 *buffer, unsigned int data_blocks,
95                          unsigned int pcm_frames)
96 {
97         struct amdtp_motu *p = s->protocol;
98         unsigned int channels = p->pcm_chunks;
99         struct snd_pcm_runtime *runtime = pcm->runtime;
100         unsigned int pcm_buffer_pointer;
101         int remaining_frames;
102         u8 *byte;
103         u32 *dst;
104         int i, c;
105
106         pcm_buffer_pointer = s->pcm_buffer_pointer + pcm_frames;
107         pcm_buffer_pointer %= runtime->buffer_size;
108
109         dst = (void *)runtime->dma_area +
110                                 frames_to_bytes(runtime, pcm_buffer_pointer);
111         remaining_frames = runtime->buffer_size - pcm_buffer_pointer;
112
113         for (i = 0; i < data_blocks; ++i) {
114                 byte = (u8 *)buffer + p->pcm_byte_offset;
115
116                 for (c = 0; c < channels; ++c) {
117                         *dst = (byte[0] << 24) |
118                                (byte[1] << 16) |
119                                (byte[2] << 8);
120                         byte += 3;
121                         dst++;
122                 }
123                 buffer += s->data_block_quadlets;
124                 if (--remaining_frames == 0)
125                         dst = (void *)runtime->dma_area;
126         }
127 }
128
129 static void write_pcm_s32(struct amdtp_stream *s, struct snd_pcm_substream *pcm,
130                           __be32 *buffer, unsigned int data_blocks,
131                           unsigned int pcm_frames)
132 {
133         struct amdtp_motu *p = s->protocol;
134         unsigned int channels = p->pcm_chunks;
135         struct snd_pcm_runtime *runtime = pcm->runtime;
136         unsigned int pcm_buffer_pointer;
137         int remaining_frames;
138         u8 *byte;
139         const u32 *src;
140         int i, c;
141
142         pcm_buffer_pointer = s->pcm_buffer_pointer + pcm_frames;
143         pcm_buffer_pointer %= runtime->buffer_size;
144
145         src = (void *)runtime->dma_area +
146                                 frames_to_bytes(runtime, pcm_buffer_pointer);
147         remaining_frames = runtime->buffer_size - pcm_buffer_pointer;
148
149         for (i = 0; i < data_blocks; ++i) {
150                 byte = (u8 *)buffer + p->pcm_byte_offset;
151
152                 for (c = 0; c < channels; ++c) {
153                         byte[0] = (*src >> 24) & 0xff;
154                         byte[1] = (*src >> 16) & 0xff;
155                         byte[2] = (*src >>  8) & 0xff;
156                         byte += 3;
157                         src++;
158                 }
159
160                 buffer += s->data_block_quadlets;
161                 if (--remaining_frames == 0)
162                         src = (void *)runtime->dma_area;
163         }
164 }
165
166 static void write_pcm_silence(struct amdtp_stream *s, __be32 *buffer,
167                               unsigned int data_blocks)
168 {
169         struct amdtp_motu *p = s->protocol;
170         unsigned int channels, i, c;
171         u8 *byte;
172
173         channels = p->pcm_chunks;
174
175         for (i = 0; i < data_blocks; ++i) {
176                 byte = (u8 *)buffer + p->pcm_byte_offset;
177
178                 for (c = 0; c < channels; ++c) {
179                         byte[0] = 0;
180                         byte[1] = 0;
181                         byte[2] = 0;
182                         byte += 3;
183                 }
184
185                 buffer += s->data_block_quadlets;
186         }
187 }
188
/*
 * Add hardware constraints of PCM runtime for the stream.
 *
 * @s:       the stream for which the generic constraints are added.
 * @runtime: the PCM runtime to constrain.
 *
 * Returns a negative error code when the msbits constraint fails, otherwise
 * the result of amdtp_stream_add_pcm_hw_constraints().
 */
int amdtp_motu_add_pcm_hw_constraints(struct amdtp_stream *s,
                                      struct snd_pcm_runtime *runtime)
{
        /* TODO: how to set a constraint for exactly 24 bit PCM samples? */
        int err = snd_pcm_hw_constraint_msbits(runtime, 0, 32, 24);

        if (err >= 0)
                err = amdtp_stream_add_pcm_hw_constraints(s, runtime);

        return err;
}
201
202 void amdtp_motu_midi_trigger(struct amdtp_stream *s, unsigned int port,
203                              struct snd_rawmidi_substream *midi)
204 {
205         struct amdtp_motu *p = s->protocol;
206
207         if (port < p->midi_ports)
208                 WRITE_ONCE(p->midi, midi);
209 }
210
211 static void write_midi_messages(struct amdtp_stream *s, __be32 *buffer,
212                                 unsigned int data_blocks)
213 {
214         struct amdtp_motu *p = s->protocol;
215         struct snd_rawmidi_substream *midi = READ_ONCE(p->midi);
216         u8 *b;
217         int i;
218
219         for (i = 0; i < data_blocks; i++) {
220                 b = (u8 *)buffer;
221
222                 if (midi && p->midi_db_count == 0 &&
223                     snd_rawmidi_transmit(midi, b + p->midi_byte_offset, 1) == 1) {
224                         b[p->midi_flag_offset] = 0x01;
225                 } else {
226                         b[p->midi_byte_offset] = 0x00;
227                         b[p->midi_flag_offset] = 0x00;
228                 }
229
230                 buffer += s->data_block_quadlets;
231
232                 if (--p->midi_db_count < 0)
233                         p->midi_db_count = p->midi_db_interval;
234         }
235 }
236
237 static void read_midi_messages(struct amdtp_stream *s, __be32 *buffer,
238                                unsigned int data_blocks)
239 {
240         struct amdtp_motu *p = s->protocol;
241         struct snd_rawmidi_substream *midi;
242         u8 *b;
243         int i;
244
245         for (i = 0; i < data_blocks; i++) {
246                 b = (u8 *)buffer;
247                 midi = READ_ONCE(p->midi);
248
249                 if (midi && (b[p->midi_flag_offset] & 0x01))
250                         snd_rawmidi_receive(midi, b + p->midi_byte_offset, 1);
251
252                 buffer += s->data_block_quadlets;
253         }
254 }
255
256 /* For tracepoints. */
257 static void __maybe_unused copy_sph(u32 *frames, __be32 *buffer,
258                                     unsigned int data_blocks,
259                                     unsigned int data_block_quadlets)
260 {
261         unsigned int i;
262
263         for (i = 0; i < data_blocks; ++i) {
264                 *frames = be32_to_cpu(*buffer);
265                 buffer += data_block_quadlets;
266                 frames++;
267         }
268 }
269
270 /* For tracepoints. */
271 static void __maybe_unused copy_message(u64 *frames, __be32 *buffer,
272                                         unsigned int data_blocks,
273                                         unsigned int data_block_quadlets)
274 {
275         unsigned int i;
276
277         /* This is just for v2/v3 protocol. */
278         for (i = 0; i < data_blocks; ++i) {
279                 *frames = (be32_to_cpu(buffer[1]) << 16) |
280                           (be32_to_cpu(buffer[2]) >> 16);
281                 buffer += data_block_quadlets;
282                 frames++;
283         }
284 }
285
286 static void probe_tracepoints_events(struct amdtp_stream *s,
287                                      const struct pkt_desc *descs,
288                                      unsigned int packets)
289 {
290         int i;
291
292         for (i = 0; i < packets; ++i) {
293                 const struct pkt_desc *desc = descs + i;
294                 __be32 *buf = desc->ctx_payload;
295                 unsigned int data_blocks = desc->data_blocks;
296
297                 trace_data_block_sph(s, data_blocks, buf);
298                 trace_data_block_message(s, data_blocks, buf);
299         }
300 }
301
302 static void cache_event_offsets(struct amdtp_motu_cache *cache, const __be32 *buf,
303                                 unsigned int data_blocks, unsigned int data_block_quadlets)
304 {
305         unsigned int *event_offsets = cache->event_offsets;
306         const unsigned int cache_size = cache->size;
307         unsigned int cache_tail = cache->tail;
308         unsigned int base_tick = cache->tx_cycle_count * TICKS_PER_CYCLE;
309         int i;
310
311         for (i = 0; i < data_blocks; ++i) {
312                 u32 sph = be32_to_cpu(*buf);
313                 unsigned int tick;
314
315                 tick = ((sph & CIP_SPH_CYCLE_MASK) >> CIP_SPH_CYCLE_SHIFT) * TICKS_PER_CYCLE +
316                        (sph & CIP_SPH_OFFSET_MASK);
317
318                 if (tick < base_tick)
319                         tick += TICKS_PER_SECOND;
320                 event_offsets[cache_tail] = tick - base_tick;
321
322                 cache_tail = (cache_tail + 1) % cache_size;
323                 buf += data_block_quadlets;
324         }
325
326         cache->tail = cache_tail;
327         cache->tx_cycle_count = (cache->tx_cycle_count + 1) % CYCLES_PER_SECOND;
328 }
329
330 static unsigned int process_ir_ctx_payloads(struct amdtp_stream *s,
331                                             const struct pkt_desc *descs,
332                                             unsigned int packets,
333                                             struct snd_pcm_substream *pcm)
334 {
335         struct amdtp_motu *p = s->protocol;
336         unsigned int pcm_frames = 0;
337         int i;
338
339         if (p->cache->tx_cycle_count == UINT_MAX)
340                 p->cache->tx_cycle_count = (s->domain->processing_cycle.tx_start % CYCLES_PER_SECOND);
341
342         // For data block processing.
343         for (i = 0; i < packets; ++i) {
344                 const struct pkt_desc *desc = descs + i;
345                 __be32 *buf = desc->ctx_payload;
346                 unsigned int data_blocks = desc->data_blocks;
347
348                 cache_event_offsets(p->cache, buf, data_blocks, s->data_block_quadlets);
349
350                 if (pcm) {
351                         read_pcm_s32(s, pcm, buf, data_blocks, pcm_frames);
352                         pcm_frames += data_blocks;
353                 }
354
355                 if (p->midi_ports)
356                         read_midi_messages(s, buf, data_blocks);
357         }
358
359         // For tracepoints.
360         if (trace_data_block_sph_enabled() ||
361             trace_data_block_message_enabled())
362                 probe_tracepoints_events(s, descs, packets);
363
364         return pcm_frames;
365 }
366
367 static void write_sph(struct amdtp_motu_cache *cache, __be32 *buffer, unsigned int data_blocks,
368                       unsigned int data_block_quadlets)
369 {
370         unsigned int *event_offsets = cache->event_offsets;
371         const unsigned int cache_size = cache->size;
372         unsigned int cache_head = cache->head;
373         unsigned int base_tick = cache->rx_cycle_count * TICKS_PER_CYCLE;
374         int i;
375
376         for (i = 0; i < data_blocks; i++) {
377                 unsigned int tick = (base_tick + event_offsets[cache_head]) % TICKS_PER_SECOND;
378                 u32 sph = ((tick / TICKS_PER_CYCLE) << CIP_SPH_CYCLE_SHIFT) | (tick % TICKS_PER_CYCLE);
379                 *buffer = cpu_to_be32(sph);
380
381                 cache_head = (cache_head + 1) % cache_size;
382                 buffer += data_block_quadlets;
383         }
384
385         cache->head = cache_head;
386         cache->rx_cycle_count = (cache->rx_cycle_count + 1) % CYCLES_PER_SECOND;
387 }
388
389 static unsigned int process_it_ctx_payloads(struct amdtp_stream *s,
390                                             const struct pkt_desc *descs,
391                                             unsigned int packets,
392                                             struct snd_pcm_substream *pcm)
393 {
394         struct amdtp_motu *p = s->protocol;
395         unsigned int pcm_frames = 0;
396         int i;
397
398         if (p->cache->rx_cycle_count == UINT_MAX)
399                 p->cache->rx_cycle_count = (s->domain->processing_cycle.rx_start % CYCLES_PER_SECOND);
400
401         // For data block processing.
402         for (i = 0; i < packets; ++i) {
403                 const struct pkt_desc *desc = descs + i;
404                 __be32 *buf = desc->ctx_payload;
405                 unsigned int data_blocks = desc->data_blocks;
406
407                 if (pcm) {
408                         write_pcm_s32(s, pcm, buf, data_blocks, pcm_frames);
409                         pcm_frames += data_blocks;
410                 } else {
411                         write_pcm_silence(s, buf, data_blocks);
412                 }
413
414                 if (p->midi_ports)
415                         write_midi_messages(s, buf, data_blocks);
416
417                 // TODO: how to interact control messages between userspace?
418
419                 write_sph(p->cache, buf, data_blocks, s->data_block_quadlets);
420         }
421
422         // For tracepoints.
423         if (trace_data_block_sph_enabled() ||
424             trace_data_block_message_enabled())
425                 probe_tracepoints_events(s, descs, packets);
426
427         return pcm_frames;
428 }
429
430 int amdtp_motu_init(struct amdtp_stream *s, struct fw_unit *unit,
431                     enum amdtp_stream_direction dir,
432                     const struct snd_motu_spec *spec, struct amdtp_motu_cache *cache)
433 {
434         amdtp_stream_process_ctx_payloads_t process_ctx_payloads;
435         int fmt = CIP_FMT_MOTU;
436         unsigned int flags = CIP_BLOCKING | CIP_UNAWARE_SYT;
437         struct amdtp_motu *p;
438         int err;
439
440         if (dir == AMDTP_IN_STREAM) {
441                 process_ctx_payloads = process_ir_ctx_payloads;
442
443                 /*
444                  * Units of version 3 transmits packets with invalid CIP header
445                  * against IEC 61883-1.
446                  */
447                 if (spec->protocol_version == SND_MOTU_PROTOCOL_V3) {
448                         flags |= CIP_WRONG_DBS |
449                                  CIP_SKIP_DBC_ZERO_CHECK |
450                                  CIP_HEADER_WITHOUT_EOH;
451                         fmt = CIP_FMT_MOTU_TX_V3;
452                 }
453
454                 if (spec == &snd_motu_spec_8pre ||
455                     spec == &snd_motu_spec_ultralite) {
456                         // 8pre has some quirks.
457                         flags |= CIP_WRONG_DBS |
458                                  CIP_SKIP_DBC_ZERO_CHECK;
459                 }
460         } else {
461                 process_ctx_payloads = process_it_ctx_payloads;
462                 flags |= CIP_DBC_IS_END_EVENT;
463         }
464
465         err = amdtp_stream_init(s, unit, dir, flags, fmt, process_ctx_payloads,
466                                 sizeof(struct amdtp_motu));
467         if (err < 0)
468                 return err;
469
470         s->sph = 1;
471
472         if (dir == AMDTP_OUT_STREAM) {
473                 // Use fixed value for FDF field.
474                 s->ctx_data.rx.fdf = MOTU_FDF_AM824;
475         }
476
477         p = s->protocol;
478         p->cache = cache;
479
480         return 0;
481 }