mirror of
https://github.com/RIOT-OS/RIOT.git
synced 2024-12-29 04:50:03 +01:00
206 lines
8.8 KiB
C
206 lines
8.8 KiB
C
|
/*
|
||
|
* Copyright 2019 Marian Buschsieweke
|
||
|
*
|
||
|
* This file is subject to the terms and conditions of the GNU Lesser
|
||
|
* General Public License v2.1. See the file LICENSE in the top level
|
||
|
* directory for more details.
|
||
|
*/
|
||
|
|
||
|
/**
|
||
|
* @ingroup drivers_ws281x
|
||
|
*
|
||
|
* @{
|
||
|
*
|
||
|
* @file
|
||
|
* @brief Implementation of `ws281x_write()` for ATmega MCUs
|
||
|
*
|
||
|
* @author Marian Buschsieweke <marian.buschsieweke@ovgu.de>
|
||
|
*
|
||
|
* @}
|
||
|
*/
|
||
|
#include <assert.h>
|
||
|
#include <errno.h>
|
||
|
#include <stdint.h>
|
||
|
#include <string.h>
|
||
|
|
||
|
#include "atmega_gpio.h"
|
||
|
#include "ws281x.h"
|
||
|
#include "ws281x_params.h"
|
||
|
#include "ws281x_constants.h"
|
||
|
#include "periph_cpu.h"
|
||
|
#include "xtimer.h"
|
||
|
/*
|
||
|
* Data encoding according to the datasheets of the WS2812 and the SK6812:
|
||
|
* - Encoding of zero bit:
|
||
|
* 1. High for 325ns ± 125ns (average of WS2812 and SK6812)
|
||
|
* 2. Low for 850ns ± 100ns (average of WS2812 and SK6812)
|
||
|
* - Encoding of one bit:
|
||
|
* 1. High for 650ns ± 100ns (average of WS2812 and SK6812)
|
||
|
* 2. Low for 600ns ± 150ns (for both WS2812 and SK6812)
|
||
|
*
|
||
|
* While the data sheet claims the opposite, the precision requirement for
|
||
|
* the duration of the second phase (the low period) is in reality super
|
||
|
* lax. Therefore, we bit bang the high period precisely in inline assembly,
|
||
|
* and completely ignore the timing of the low phase. This works just fine.
|
||
|
*
|
||
|
* Further: For an 8MHz clock, we need a single CPU cycle access to the
|
||
|
* GPIO port. The is only possible with the `out` instruction, which takes
|
||
|
* the port to write to as immediate. Thus, it has to be known at compile
|
||
|
* time. We therefore simply provide 3 implementations for each of the
|
||
|
* three most commonly used GPIO ports. For the 16MHz version accessing the
|
||
|
* GPIO port via memory using the st instruction works fine, so no limitations
|
||
|
* on the GPIO por there.
|
||
|
*
|
||
|
* On final trick: A relative jump to the next instructions takes two
|
||
|
* CPU cycles; this, its 2 NOPs for the price of one (in terms of ROM
|
||
|
* consumption).
|
||
|
*
|
||
|
* High phase timings
|
||
|
*
|
||
|
* +------------+-------------------+-------------------+-------------------+
|
||
|
* | Data | Device/Frequency | Min | Max |
|
||
|
* +------------+-------------------+-------------------+-------------------+
|
||
|
* | 0 bit | WS2812 | 200ns | 500ns |
|
||
|
* | 1 bit | WS2812 | 550ns | 850ns (*) |
|
||
|
* +------------+-------------------+-------------------+-------------------+
|
||
|
* | 0 bit | SK6812 | 150ns | 450ns |
|
||
|
* | 1 bit | SK6812 | 450ns | 750ns |
|
||
|
* +------------+-------------------+-------------------+-------------------+
|
||
|
* | 0 bit | WS2812/SK6812 | 200ns | 450ns |
|
||
|
* | 1 bit | WS2812/SK6812 | 550ns | 750ns |
|
||
|
* +------------+-------------------+-------------------+-------------------+
|
||
|
* | 0 bit | 8 MHz | 2 Cycles (250ns) | 3 Cycles (375ns) |
|
||
|
* | 1 bit | 8 MHz | 5 Cycles (625ns) | 6 Cycles (750ns) |
|
||
|
* +------------+-------------------+-------------------+-------------------+
|
||
|
* | 0 bit | 16 MHz | 4 Cycles (250ns) | 7 Cycles (438ns) |
|
||
|
* | 1 bit | 16 MHz | 9 Cycles (563ns) | 12 Cycles (750ns) |
|
||
|
* +------------+-------------------+-------------------+-------------------+
|
||
|
*
|
||
|
* (*) The high time for encoding a 1 bit on the WS2812 has no upper bound in
|
||
|
* practise; A high period of 5 seconds has been reported to work reliable.
|
||
|
*/
|
||
|
|
||
|
void ws281x_write_buffer(ws281x_t *dev, const void *buf, size_t size)
|
||
|
{
|
||
|
assert(dev);
|
||
|
const uint8_t *pos = buf;
|
||
|
const uint8_t *end = pos + size;
|
||
|
uint16_t port_addr = atmega_port_addr(dev->params.pin);
|
||
|
uint8_t mask_on, mask_off;
|
||
|
|
||
|
{
|
||
|
uint8_t port_state = _SFR_MEM8(port_addr);
|
||
|
mask_on = port_state | (1 << atmega_pin_num(dev->params.pin));
|
||
|
mask_off = port_state & ~(1 << atmega_pin_num(dev->params.pin));
|
||
|
}
|
||
|
|
||
|
#if (CLOCK_CORECLOCK >= 7500000U) && (CLOCK_CORECLOCK <= 8500000U)
|
||
|
const uint8_t port_num = atmega_port_num(dev->params.pin);
|
||
|
switch (port_num) {
|
||
|
case PORT_B:
|
||
|
while (pos < end) {
|
||
|
uint8_t cnt = 8;
|
||
|
uint8_t data = *pos;
|
||
|
while (cnt > 0) {
|
||
|
__asm__ volatile( /* Cycles | 1 | 0 */
|
||
|
"out %[port], %[on]" "\n\t" /* 1 | x | x */
|
||
|
"sbrs %[data], 7" "\n\t" /* 1 | x | x */
|
||
|
"out %[port], %[off]" "\n\t" /* 1 | - | x */
|
||
|
"rjmp .+0" "\n\t" /* 2 | x | x */
|
||
|
"out %[port], %[off]" "\n\t" /* 1 | x | x */
|
||
|
/* Total CPU cycles for high period:
|
||
|
* 5 cycles for bit 1, 2 cycles for bit 0 */
|
||
|
: [data] "+r" (data)
|
||
|
: [port] "I" (_SFR_IO_ADDR(PORTB)),
|
||
|
[on] "r" (mask_on),
|
||
|
[off] "r" (mask_off)
|
||
|
);
|
||
|
cnt--;
|
||
|
data <<= 1;
|
||
|
}
|
||
|
pos++;
|
||
|
}
|
||
|
break;
|
||
|
case PORT_C:
|
||
|
while (pos < end) {
|
||
|
uint8_t cnt = 8;
|
||
|
uint8_t data = *pos;
|
||
|
while (cnt > 0) {
|
||
|
__asm__ volatile( /* Cycles | 1 | 0 */
|
||
|
"out %[port], %[on]" "\n\t" /* 1 | x | x */
|
||
|
"sbrs %[data], 7" "\n\t" /* 1 | x | x */
|
||
|
"out %[port], %[off]" "\n\t" /* 1 | - | x */
|
||
|
"rjmp .+0" "\n\t" /* 2 | x | x */
|
||
|
"out %[port], %[off]" "\n\t" /* 1 | x | x */
|
||
|
/* Total CPU cycles for high period:
|
||
|
* 5 cycles for bit 1, 2 cycles for bit 0 */
|
||
|
: [data] "+r" (data)
|
||
|
: [port] "I" (_SFR_IO_ADDR(PORTC)),
|
||
|
[on] "r" (mask_on),
|
||
|
[off] "r" (mask_off)
|
||
|
);
|
||
|
cnt--;
|
||
|
data <<= 1;
|
||
|
}
|
||
|
pos++;
|
||
|
}
|
||
|
break;
|
||
|
case PORT_D:
|
||
|
while (pos < end) {
|
||
|
uint8_t cnt = 8;
|
||
|
uint8_t data = *pos;
|
||
|
while (cnt > 0) {
|
||
|
__asm__ volatile( /* Cycles | 1 | 0 */
|
||
|
"out %[port], %[on]" "\n\t" /* 1 | x | x */
|
||
|
"sbrs %[data], 7" "\n\t" /* 1 | x | x */
|
||
|
"out %[port], %[off]" "\n\t" /* 1 | - | x */
|
||
|
"rjmp .+0" "\n\t" /* 2 | x | x */
|
||
|
"out %[port], %[off]" "\n\t" /* 1 | x | x */
|
||
|
/* Total CPU cycles for high period:
|
||
|
* 5 cycles for bit 1, 2 cycles for bit 0 */
|
||
|
: [data] "+r" (data)
|
||
|
: [port] "I" (_SFR_IO_ADDR(PORTD)),
|
||
|
[on] "r" (mask_on),
|
||
|
[off] "r" (mask_off)
|
||
|
);
|
||
|
cnt--;
|
||
|
data <<= 1;
|
||
|
}
|
||
|
pos++;
|
||
|
}
|
||
|
break;
|
||
|
default:
|
||
|
assert(0);
|
||
|
break;
|
||
|
}
|
||
|
#elif (CLOCK_CORECLOCK >= 15500000U) && (CLOCK_CORECLOCK <= 16500000U)
|
||
|
while (pos < end) {
|
||
|
uint8_t cnt = 8;
|
||
|
uint8_t data = *pos;
|
||
|
while (cnt > 0) {
|
||
|
__asm__ volatile( /* CPU Cycles | 1 | 0 */
|
||
|
"st %a[port], %[on]" "\n\t" /* 2 | x | x */
|
||
|
"sbrc %[data], 7" "\n\t" /* 1 | x | x */
|
||
|
"rjmp .+0" "\n\t" /* 2 | x | - */
|
||
|
"sbrc %[data], 7" "\n\t" /* 1 | x | x */
|
||
|
"rjmp .+0" "\n\t" /* 2 | x | - */
|
||
|
"sbrc %[data], 7" "\n\t" /* 1 | x | x */
|
||
|
"nop" "\n\t" /* 1 | x | - */
|
||
|
"st %a[port], %[off]" "\n\t" /* 2 | x | x */
|
||
|
/* Total CPU cycles for high period:
|
||
|
* 10 cycles for bit 1, 5 cycles for bit 0 */
|
||
|
: [data] "+r" (data)
|
||
|
: [on] "r" (mask_on),
|
||
|
[port] "e" (port_addr),
|
||
|
[off] "r" (mask_off)
|
||
|
);
|
||
|
cnt--;
|
||
|
data <<= 1;
|
||
|
}
|
||
|
pos++;
|
||
|
}
|
||
|
#else
|
||
|
#error "No low level WS281x implementation for ATmega CPUs for your CPU clock"
|
||
|
#endif
|
||
|
}
|