3723 lines
127 KiB
C++
3723 lines
127 KiB
C++
/*!
|
|
* @file Adafruit_NeoPixel.cpp
|
|
*
|
|
* @mainpage Arduino Library for driving Adafruit NeoPixel addressable LEDs,
|
|
* FLORA RGB Smart Pixels and compatible devicess -- WS2811, WS2812, WS2812B,
|
|
* SK6812, etc.
|
|
*
|
|
* @section intro_sec Introduction
|
|
*
|
|
* This is the documentation for Adafruit's NeoPixel library for the
|
|
* Arduino platform, allowing a broad range of microcontroller boards
|
|
* (most AVR boards, many ARM devices, ESP8266 and ESP32, among others)
|
|
* to control Adafruit NeoPixels, FLORA RGB Smart Pixels and compatible
|
|
* devices -- WS2811, WS2812, WS2812B, SK6812, etc.
|
|
*
|
|
* Adafruit invests time and resources providing this open source code,
|
|
* please support Adafruit and open-source hardware by purchasing products
|
|
* from Adafruit!
|
|
*
|
|
* @section author Author
|
|
*
|
|
* Written by Phil "Paint Your Dragon" Burgess for Adafruit Industries,
|
|
* with contributions by PJRC, Michael Miller and other members of the
|
|
* open source community.
|
|
*
|
|
* @section license License
|
|
*
|
|
* This file is part of the Adafruit_NeoPixel library.
|
|
*
|
|
* Adafruit_NeoPixel is free software: you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public License as
|
|
* published by the Free Software Foundation, either version 3 of the
|
|
* License, or (at your option) any later version.
|
|
*
|
|
* Adafruit_NeoPixel is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with NeoPixel. If not, see
|
|
* <http://www.gnu.org/licenses/>.
|
|
*
|
|
*/
|
|
|
|
#include "Adafruit_NeoPixel.h"
|
|
|
|
#if defined(TARGET_LPC1768)
|
|
#include <time.h>
|
|
#endif
|
|
|
|
#if defined(NRF52) || defined(NRF52_SERIES)
|
|
#include "nrf.h"
|
|
|
|
// Interrupt is only disabled if there is no PWM device available
|
|
// Note: Adafruit Bluefruit nrf52 does not use this option
|
|
//#define NRF52_DISABLE_INT
|
|
#endif
|
|
|
|
#if defined(ARDUINO_ARCH_NRF52840)
|
|
#if defined __has_include
|
|
#if __has_include(<pinDefinitions.h>)
|
|
#include <pinDefinitions.h>
|
|
#endif
|
|
#endif
|
|
#endif
|
|
|
|
/*!
|
|
@brief NeoPixel constructor when length, pin and pixel type are known
|
|
at compile-time.
|
|
@param n Number of NeoPixels in strand.
|
|
@param p Arduino pin number which will drive the NeoPixel data in.
|
|
@param t Pixel type -- add together NEO_* constants defined in
|
|
Adafruit_NeoPixel.h, for example NEO_GRB+NEO_KHZ800 for
|
|
NeoPixels expecting an 800 KHz (vs 400 KHz) data stream
|
|
with color bytes expressed in green, red, blue order per
|
|
pixel.
|
|
@return Adafruit_NeoPixel object. Call the begin() function before use.
|
|
*/
|
|
Adafruit_NeoPixel::Adafruit_NeoPixel(uint16_t n, int16_t p, neoPixelType t)
|
|
: begun(false), brightness(0), pixels(NULL), endTime(0) {
|
|
updateType(t);
|
|
updateLength(n);
|
|
setPin(p);
|
|
#if defined(ARDUINO_ARCH_RP2040)
|
|
// Find a free SM on one of the PIO's
|
|
sm = pio_claim_unused_sm(pio, false); // don't panic
|
|
// Try pio1 if SM not found
|
|
if (sm < 0) {
|
|
pio = pio1;
|
|
sm = pio_claim_unused_sm(pio, true); // panic if no SM is free
|
|
}
|
|
init = true;
|
|
#endif
|
|
}
|
|
|
|
/*!
|
|
@brief "Empty" NeoPixel constructor when length, pin and/or pixel type
|
|
are not known at compile-time, and must be initialized later with
|
|
updateType(), updateLength() and setPin().
|
|
@return Adafruit_NeoPixel object. Call the begin() function before use.
|
|
@note This function is deprecated, here only for old projects that
|
|
may still be calling it. New projects should instead use the
|
|
'new' keyword with the first constructor syntax (length, pin,
|
|
type).
|
|
*/
|
|
Adafruit_NeoPixel::Adafruit_NeoPixel()
|
|
:
|
|
#if defined(NEO_KHZ400)
|
|
is800KHz(true),
|
|
#endif
|
|
begun(false), numLEDs(0), numBytes(0), pin(-1), brightness(0),
|
|
pixels(NULL), rOffset(1), gOffset(0), bOffset(2), wOffset(1), endTime(0) {
|
|
}
|
|
|
|
/*!
|
|
@brief Deallocate Adafruit_NeoPixel object, set data pin back to INPUT.
|
|
*/
|
|
Adafruit_NeoPixel::~Adafruit_NeoPixel() {
|
|
free(pixels);
|
|
if (pin >= 0)
|
|
pinMode(pin, INPUT);
|
|
}
|
|
|
|
/*!
|
|
@brief Configure NeoPixel pin for output.
|
|
*/
|
|
void Adafruit_NeoPixel::begin(void) {
|
|
if (pin >= 0) {
|
|
pinMode(pin, OUTPUT);
|
|
digitalWrite(pin, LOW);
|
|
}
|
|
begun = true;
|
|
}
|
|
|
|
/*!
|
|
@brief Change the length of a previously-declared Adafruit_NeoPixel
|
|
strip object. Old data is deallocated and new data is cleared.
|
|
Pin number and pixel format are unchanged.
|
|
@param n New length of strip, in pixels.
|
|
@note This function is deprecated, here only for old projects that
|
|
may still be calling it. New projects should instead use the
|
|
'new' keyword with the first constructor syntax (length, pin,
|
|
type).
|
|
*/
|
|
void Adafruit_NeoPixel::updateLength(uint16_t n) {
|
|
free(pixels); // Free existing data (if any)
|
|
|
|
// Allocate new data -- note: ALL PIXELS ARE CLEARED
|
|
numBytes = n * ((wOffset == rOffset) ? 3 : 4);
|
|
if ((pixels = (uint8_t *)malloc(numBytes))) {
|
|
memset(pixels, 0, numBytes);
|
|
numLEDs = n;
|
|
} else {
|
|
numLEDs = numBytes = 0;
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Change the pixel format of a previously-declared
|
|
Adafruit_NeoPixel strip object. If format changes from one of
|
|
the RGB variants to an RGBW variant (or RGBW to RGB), the old
|
|
data will be deallocated and new data is cleared. Otherwise,
|
|
the old data will remain in RAM and is not reordered to the
|
|
new format, so it's advisable to follow up with clear().
|
|
@param t Pixel type -- add together NEO_* constants defined in
|
|
Adafruit_NeoPixel.h, for example NEO_GRB+NEO_KHZ800 for
|
|
NeoPixels expecting an 800 KHz (vs 400 KHz) data stream
|
|
with color bytes expressed in green, red, blue order per
|
|
pixel.
|
|
@note This function is deprecated, here only for old projects that
|
|
may still be calling it. New projects should instead use the
|
|
'new' keyword with the first constructor syntax
|
|
(length, pin, type).
|
|
*/
|
|
void Adafruit_NeoPixel::updateType(neoPixelType t) {
|
|
bool oldThreeBytesPerPixel = (wOffset == rOffset); // false if RGBW
|
|
|
|
wOffset = (t >> 6) & 0b11; // See notes in header file
|
|
rOffset = (t >> 4) & 0b11; // regarding R/G/B/W offsets
|
|
gOffset = (t >> 2) & 0b11;
|
|
bOffset = t & 0b11;
|
|
#if defined(NEO_KHZ400)
|
|
is800KHz = (t < 256); // 400 KHz flag is 1<<8
|
|
#endif
|
|
|
|
// If bytes-per-pixel has changed (and pixel data was previously
|
|
// allocated), re-allocate to new size. Will clear any data.
|
|
if (pixels) {
|
|
bool newThreeBytesPerPixel = (wOffset == rOffset);
|
|
if (newThreeBytesPerPixel != oldThreeBytesPerPixel)
|
|
updateLength(numLEDs);
|
|
}
|
|
}
|
|
|
|
// RP2040 specific driver
|
|
#if defined(ARDUINO_ARCH_RP2040)
|
|
void Adafruit_NeoPixel::rp2040Init(uint8_t pin, bool is800KHz)
|
|
{
|
|
uint offset = pio_add_program(pio, &ws2812_program);
|
|
|
|
if (is800KHz)
|
|
{
|
|
// 800kHz, 8 bit transfers
|
|
ws2812_program_init(pio, sm, offset, pin, 800000, 8);
|
|
}
|
|
else
|
|
{
|
|
// 400kHz, 8 bit transfers
|
|
ws2812_program_init(pio, sm, offset, pin, 400000, 8);
|
|
}
|
|
}
|
|
// Not a user API
|
|
void Adafruit_NeoPixel::rp2040Show(uint8_t pin, uint8_t *pixels, uint32_t numBytes, bool is800KHz)
|
|
{
|
|
if (this->init)
|
|
{
|
|
// On first pass through initialise the PIO
|
|
rp2040Init(pin, is800KHz);
|
|
this->init = false;
|
|
}
|
|
|
|
while(numBytes--)
|
|
// Bits for transmission must be shifted to top 8 bits
|
|
pio_sm_put_blocking(pio, sm, ((uint32_t)*pixels++)<< 24);
|
|
}
|
|
#elif defined(ARDUINO_ARCH_CH32)
|
|
|
|
// F_CPU is defined to SystemCoreClock (not constant number)
|
|
#if SYSCLK_FREQ_144MHz_HSE == 144000000 || SYSCLK_FREQ_HSE == 144000000 || \
|
|
SYSCLK_FREQ_144MHz_HSI == 144000000 || SYSCLK_FREQ_HSI == 144000000
|
|
#define CH32_F_CPU 144000000
|
|
|
|
#elif SYSCLK_FREQ_120MHz_HSE == 120000000 || SYSCLK_FREQ_HSE == 120000000 || \
|
|
SYSCLK_FREQ_120MHz_HSI == 120000000 || SYSCLK_FREQ_HSI == 120000000
|
|
#define CH32_F_CPU 120000000
|
|
|
|
#elif SYSCLK_FREQ_96MHz_HSE == 96000000 || SYSCLK_FREQ_HSE == 96000000 || \
|
|
SYSCLK_FREQ_96MHz_HSI == 96000000 || SYSCLK_FREQ_HSI == 96000000
|
|
#define CH32_F_CPU 96000000
|
|
|
|
#elif SYSCLK_FREQ_72MHz_HSE == 72000000 || SYSCLK_FREQ_HSE == 72000000 || \
|
|
SYSCLK_FREQ_72MHz_HSI == 72000000 || SYSCLK_FREQ_HSI == 72000000
|
|
#define CH32_F_CPU 72000000
|
|
|
|
#elif SYSCLK_FREQ_56MHz_HSE == 56000000 || SYSCLK_FREQ_HSE == 56000000 || \
|
|
SYSCLK_FREQ_56MHz_HSI == 56000000 || SYSCLK_FREQ_HSI == 56000000
|
|
#define CH32_F_CPU 56000000
|
|
|
|
#elif SYSCLK_FREQ_48MHz_HSE == 48000000 || SYSCLK_FREQ_HSE == 48000000 || \
|
|
SYSCLK_FREQ_48MHz_HSI == 48000000 || SYSCLK_FREQ_HSI == 48000000
|
|
#define CH32_F_CPU 48000000
|
|
|
|
#endif
|
|
|
|
static void ch32Show(GPIO_TypeDef* ch_port, uint32_t ch_pin, uint8_t* pixels, uint32_t numBytes, bool is800KHz) {
|
|
// not support 400khz
|
|
if (!is800KHz) return;
|
|
|
|
volatile uint32_t* set = &ch_port->BSHR;
|
|
volatile uint32_t* clr = &ch_port->BCR;
|
|
|
|
uint8_t* ptr = pixels;
|
|
uint8_t* end = ptr + numBytes;
|
|
uint8_t p = *ptr++;
|
|
uint8_t bitMask = 0x80;
|
|
|
|
// NVIC_DisableIRQ(SysTicK_IRQn);
|
|
|
|
while (1) {
|
|
if (p & bitMask) { // ONE
|
|
// High 800ns
|
|
*set = ch_pin;
|
|
__asm volatile ("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop;"
|
|
#if CH32_F_CPU >= 72000000
|
|
"nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 96000000
|
|
"nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 120000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 144000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
);
|
|
|
|
// Low 450ns
|
|
*clr = ch_pin;
|
|
__asm volatile ("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop;"
|
|
#if CH32_F_CPU >= 72000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 96000000
|
|
"nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 120000000
|
|
"nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 144000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
);
|
|
} else { // ZERO
|
|
// High 400ns
|
|
*set = ch_pin;
|
|
__asm volatile ("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop;"
|
|
#if CH32_F_CPU >= 72000000
|
|
"nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 96000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 120000000
|
|
"nop; nop; nop; "
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 144000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
);
|
|
|
|
// Low 850ns
|
|
*clr = ch_pin;
|
|
__asm volatile ("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop;"
|
|
#if CH32_F_CPU >= 72000000
|
|
"nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 96000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 120000000
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
#if CH32_F_CPU >= 144000000
|
|
"nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
#endif
|
|
);
|
|
}
|
|
|
|
if (bitMask >>= 1) {
|
|
// Move on to the next pixel
|
|
asm("nop;");
|
|
}
|
|
else {
|
|
if (ptr >= end) {
|
|
break;
|
|
}
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
|
|
// NVIC_EnableIRQ(SysTicK_IRQn);
|
|
}
|
|
#endif
|
|
|
|
#if defined(ESP8266)
|
|
// ESP8266 show() is external to enforce ICACHE_RAM_ATTR execution
|
|
extern "C" IRAM_ATTR void espShow(uint16_t pin, uint8_t *pixels,
|
|
uint32_t numBytes, uint8_t type);
|
|
#elif defined(ESP32)
|
|
extern "C" void espShow(uint16_t pin, uint8_t *pixels, uint32_t numBytes,
|
|
uint8_t type);
|
|
#endif // ESP8266
|
|
|
|
#if defined(K210)
|
|
#define KENDRYTE_K210 1
|
|
#endif
|
|
|
|
#if defined(KENDRYTE_K210)
|
|
extern "C" void k210Show(uint8_t pin, uint8_t *pixels, uint32_t numBytes,
|
|
boolean is800KHz);
|
|
#endif // KENDRYTE_K210
|
|
/*!
|
|
@brief Transmit pixel data in RAM to NeoPixels.
|
|
@note On most architectures, interrupts are temporarily disabled in
|
|
order to achieve the correct NeoPixel signal timing. This means
|
|
that the Arduino millis() and micros() functions, which require
|
|
interrupts, will lose small intervals of time whenever this
|
|
function is called (about 30 microseconds per RGB pixel, 40 for
|
|
RGBW pixels). There's no easy fix for this, but a few
|
|
specialized alternative or companion libraries exist that use
|
|
very device-specific peripherals to work around it.
|
|
*/
|
|
void Adafruit_NeoPixel::show(void) {
|
|
|
|
if (!pixels)
|
|
return;
|
|
|
|
// Data latch = 300+ microsecond pause in the output stream. Rather than
|
|
// put a delay at the end of the function, the ending time is noted and
|
|
// the function will simply hold off (if needed) on issuing the
|
|
// subsequent round of data until the latch time has elapsed. This
|
|
// allows the mainline code to start generating the next frame of data
|
|
// rather than stalling for the latch.
|
|
while (!canShow())
|
|
;
|
|
// endTime is a private member (rather than global var) so that multiple
|
|
// instances on different pins can be quickly issued in succession (each
|
|
// instance doesn't delay the next).
|
|
|
|
// In order to make this code runtime-configurable to work with any pin,
|
|
// SBI/CBI instructions are eschewed in favor of full PORT writes via the
|
|
// OUT or ST instructions. It relies on two facts: that peripheral
|
|
// functions (such as PWM) take precedence on output pins, so our PORT-
|
|
// wide writes won't interfere, and that interrupts are globally disabled
|
|
// while data is being issued to the LEDs, so no other code will be
|
|
// accessing the PORT. The code takes an initial 'snapshot' of the PORT
|
|
// state, computes 'pin high' and 'pin low' values, and writes these back
|
|
// to the PORT register as needed.
|
|
|
|
// NRF52 may use PWM + DMA (if available), may not need to disable interrupt
|
|
// ESP32 may not disable interrupts because espShow() uses RMT which tries to acquire locks
|
|
#if !(defined(NRF52) || defined(NRF52_SERIES) || defined(ESP32))
|
|
noInterrupts(); // Need 100% focus on instruction timing
|
|
#endif
|
|
|
|
#if defined(__AVR__)
|
|
// AVR MCUs -- ATmega & ATtiny (no XMEGA) ---------------------------------
|
|
|
|
volatile uint16_t i = numBytes; // Loop counter
|
|
volatile uint8_t *ptr = pixels, // Pointer to next byte
|
|
b = *ptr++, // Current byte value
|
|
hi, // PORT w/output bit set high
|
|
lo; // PORT w/output bit set low
|
|
|
|
// Hand-tuned assembly code issues data to the LED drivers at a specific
|
|
// rate. There's separate code for different CPU speeds (8, 12, 16 MHz)
|
|
// for both the WS2811 (400 KHz) and WS2812 (800 KHz) drivers. The
|
|
// datastream timing for the LED drivers allows a little wiggle room each
|
|
// way (listed in the datasheets), so the conditions for compiling each
|
|
// case are set up for a range of frequencies rather than just the exact
|
|
// 8, 12 or 16 MHz values, permitting use with some close-but-not-spot-on
|
|
// devices (e.g. 16.5 MHz DigiSpark). The ranges were arrived at based
|
|
// on the datasheet figures and have not been extensively tested outside
|
|
// the canonical 8/12/16 MHz speeds; there's no guarantee these will work
|
|
// close to the extremes (or possibly they could be pushed further).
|
|
// Keep in mind only one CPU speed case actually gets compiled; the
|
|
// resulting program isn't as massive as it might look from source here.
|
|
|
|
// 8 MHz(ish) AVR ---------------------------------------------------------
|
|
#if (F_CPU >= 7400000UL) && (F_CPU <= 9500000UL)
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
|
|
volatile uint8_t n1, n2 = 0; // First, next bits out
|
|
|
|
// Squeezing an 800 KHz stream out of an 8 MHz chip requires code
|
|
// specific to each PORT register.
|
|
|
|
// 10 instruction clocks per bit: HHxxxxxLLL
|
|
// OUT instructions: ^ ^ ^ (T=0,2,7)
|
|
|
|
// PORTD OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTD)
|
|
#if defined(PORTB) || defined(PORTC) || defined(PORTF)
|
|
if (port == &PORTD) {
|
|
#endif // defined(PORTB/C/F)
|
|
|
|
hi = PORTD | pinMask;
|
|
lo = PORTD & ~pinMask;
|
|
n1 = lo;
|
|
if (b & 0x80)
|
|
n1 = hi;
|
|
|
|
// Dirty trick: RJMPs proceeding to the next instruction are used
|
|
// to delay two clock cycles in one instruction word (rather than
|
|
// using two NOPs). This was necessary in order to squeeze the
|
|
// loop down to exactly 64 words -- the maximum possible for a
|
|
// relative branch.
|
|
|
|
asm volatile(
|
|
"headD:"
|
|
"\n\t" // Clk Pseudocode
|
|
// Bit 7:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t" // 1 n2 = lo
|
|
"out %[port] , %[n1]"
|
|
"\n\t" // 1 PORT = n1
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
"sbrc %[byte] , 6"
|
|
"\n\t" // 1-2 if(b & 0x40)
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t" // 0-1 n2 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
// Bit 6:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t" // 1 n1 = lo
|
|
"out %[port] , %[n2]"
|
|
"\n\t" // 1 PORT = n2
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
"sbrc %[byte] , 5"
|
|
"\n\t" // 1-2 if(b & 0x20)
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t" // 0-1 n1 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
// Bit 5:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t" // 1 n2 = lo
|
|
"out %[port] , %[n1]"
|
|
"\n\t" // 1 PORT = n1
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
"sbrc %[byte] , 4"
|
|
"\n\t" // 1-2 if(b & 0x10)
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t" // 0-1 n2 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
// Bit 4:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t" // 1 n1 = lo
|
|
"out %[port] , %[n2]"
|
|
"\n\t" // 1 PORT = n2
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
"sbrc %[byte] , 3"
|
|
"\n\t" // 1-2 if(b & 0x08)
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t" // 0-1 n1 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
// Bit 3:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t" // 1 n2 = lo
|
|
"out %[port] , %[n1]"
|
|
"\n\t" // 1 PORT = n1
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
"sbrc %[byte] , 2"
|
|
"\n\t" // 1-2 if(b & 0x04)
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t" // 0-1 n2 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
// Bit 2:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t" // 1 n1 = lo
|
|
"out %[port] , %[n2]"
|
|
"\n\t" // 1 PORT = n2
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
"sbrc %[byte] , 1"
|
|
"\n\t" // 1-2 if(b & 0x02)
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t" // 0-1 n1 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
// Bit 1:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t" // 1 n2 = lo
|
|
"out %[port] , %[n1]"
|
|
"\n\t" // 1 PORT = n1
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop
|
|
"sbrc %[byte] , 0"
|
|
"\n\t" // 1-2 if(b & 0x01)
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t" // 0-1 n2 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"sbiw %[count], 1"
|
|
"\n\t" // 2 i-- (don't act on Z flag yet)
|
|
// Bit 0:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t" // 1 n1 = lo
|
|
"out %[port] , %[n2]"
|
|
"\n\t" // 1 PORT = n2
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t" // 2 b = *ptr++
|
|
"sbrc %[byte] , 7"
|
|
"\n\t" // 1-2 if(b & 0x80)
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t" // 0-1 n1 = hi
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo
|
|
"brne headD"
|
|
"\n" // 2 while(i) (Z flag set above)
|
|
: [byte] "+r"(b), [n1] "+r"(n1), [n2] "+r"(n2), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTD)), [ptr] "e"(ptr), [hi] "r"(hi),
|
|
[lo] "r"(lo));
|
|
|
|
#if defined(PORTB) || defined(PORTC) || defined(PORTF)
|
|
} else // other PORT(s)
|
|
#endif // defined(PORTB/C/F)
|
|
#endif // defined(PORTD)
|
|
|
|
// PORTB OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTB)
|
|
#if defined(PORTD) || defined(PORTC) || defined(PORTF)
|
|
if (port == &PORTB) {
|
|
#endif // defined(PORTD/C/F)
|
|
|
|
// Same as above, just switched to PORTB and stripped of comments.
|
|
hi = PORTB | pinMask;
|
|
lo = PORTB & ~pinMask;
|
|
n1 = lo;
|
|
if (b & 0x80)
|
|
n1 = hi;
|
|
|
|
asm volatile(
|
|
"headB:"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 6"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 5"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 4"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 3"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 2"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 1"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 0"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"sbiw %[count], 1"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t"
|
|
"sbrc %[byte] , 7"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"brne headB"
|
|
"\n"
|
|
: [byte] "+r"(b), [n1] "+r"(n1), [n2] "+r"(n2), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTB)), [ptr] "e"(ptr), [hi] "r"(hi),
|
|
[lo] "r"(lo));
|
|
|
|
#if defined(PORTD) || defined(PORTC) || defined(PORTF)
|
|
}
|
|
#endif
|
|
#if defined(PORTC) || defined(PORTF)
|
|
else
|
|
#endif // defined(PORTC/F)
|
|
#endif // defined(PORTB)
|
|
|
|
// PORTC OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTC)
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTF)
|
|
if (port == &PORTC) {
|
|
#endif // defined(PORTD/B/F)
|
|
|
|
// Same as above, just switched to PORTC and stripped of comments.
|
|
hi = PORTC | pinMask;
|
|
lo = PORTC & ~pinMask;
|
|
n1 = lo;
|
|
if (b & 0x80)
|
|
n1 = hi;
|
|
|
|
asm volatile(
|
|
"headC:"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 6"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 5"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 4"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 3"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 2"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 1"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 0"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"sbiw %[count], 1"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t"
|
|
"sbrc %[byte] , 7"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"brne headC"
|
|
"\n"
|
|
: [byte] "+r"(b), [n1] "+r"(n1), [n2] "+r"(n2), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTC)), [ptr] "e"(ptr), [hi] "r"(hi),
|
|
[lo] "r"(lo));
|
|
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTF)
|
|
}
|
|
#endif // defined(PORTD/B/F)
|
|
#if defined(PORTF)
|
|
else
|
|
#endif
|
|
#endif // defined(PORTC)
|
|
|
|
// PORTF OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTF)
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTC)
|
|
if (port == &PORTF) {
|
|
#endif // defined(PORTD/B/C)
|
|
|
|
hi = PORTF | pinMask;
|
|
lo = PORTF & ~pinMask;
|
|
n1 = lo;
|
|
if (b & 0x80)
|
|
n1 = hi;
|
|
|
|
asm volatile(
|
|
"headF:"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 6"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 5"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 4"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 3"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 2"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 1"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n2] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n1]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"sbrc %[byte] , 0"
|
|
"\n\t"
|
|
"mov %[n2] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"sbiw %[count], 1"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"mov %[n1] , %[lo]"
|
|
"\n\t"
|
|
"out %[port] , %[n2]"
|
|
"\n\t"
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t"
|
|
"sbrc %[byte] , 7"
|
|
"\n\t"
|
|
"mov %[n1] , %[hi]"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"brne headF"
|
|
"\n"
|
|
: [byte] "+r"(b), [n1] "+r"(n1), [n2] "+r"(n2), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTF)), [ptr] "e"(ptr), [hi] "r"(hi),
|
|
[lo] "r"(lo));
|
|
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTC)
|
|
}
|
|
#endif // defined(PORTD/B/C)
|
|
#endif // defined(PORTF)
|
|
|
|
#if defined(NEO_KHZ400)
|
|
} else { // end 800 KHz, do 400 KHz
|
|
|
|
// Timing is more relaxed; unrolling the inner loop for each bit is
|
|
// not necessary. Still using the peculiar RJMPs as 2X NOPs, not out
|
|
// of need but just to trim the code size down a little.
|
|
// This 400-KHz-datastream-on-8-MHz-CPU code is not quite identical
|
|
// to the 800-on-16 code later -- the hi/lo timing between WS2811 and
|
|
// WS2812 is not simply a 2:1 scale!
|
|
|
|
// 20 inst. clocks per bit: HHHHxxxxxxLLLLLLLLLL
|
|
// ST instructions: ^ ^ ^ (T=0,4,10)
|
|
|
|
volatile uint8_t next, bit;
|
|
|
|
hi = *port | pinMask;
|
|
lo = *port & ~pinMask;
|
|
next = lo;
|
|
bit = 8;
|
|
|
|
asm volatile("head20:"
|
|
"\n\t" // Clk Pseudocode (T = 0)
|
|
"st %a[port], %[hi]"
|
|
"\n\t" // 2 PORT = hi (T = 2)
|
|
"sbrc %[byte] , 7"
|
|
"\n\t" // 1-2 if(b & 128)
|
|
"mov %[next], %[hi]"
|
|
"\n\t" // 0-1 next = hi (T = 4)
|
|
"st %a[port], %[next]"
|
|
"\n\t" // 2 PORT = next (T = 6)
|
|
"mov %[next] , %[lo]"
|
|
"\n\t" // 1 next = lo (T = 7)
|
|
"dec %[bit]"
|
|
"\n\t" // 1 bit-- (T = 8)
|
|
"breq nextbyte20"
|
|
"\n\t" // 1-2 if(bit == 0)
|
|
"rol %[byte]"
|
|
"\n\t" // 1 b <<= 1 (T = 10)
|
|
"st %a[port], %[lo]"
|
|
"\n\t" // 2 PORT = lo (T = 12)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 14)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 16)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 18)
|
|
"rjmp head20"
|
|
"\n\t" // 2 -> head20 (next bit out)
|
|
"nextbyte20:"
|
|
"\n\t" // (T = 10)
|
|
"st %a[port], %[lo]"
|
|
"\n\t" // 2 PORT = lo (T = 12)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 13)
|
|
"ldi %[bit] , 8"
|
|
"\n\t" // 1 bit = 8 (T = 14)
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t" // 2 b = *ptr++ (T = 16)
|
|
"sbiw %[count], 1"
|
|
"\n\t" // 2 i-- (T = 18)
|
|
"brne head20"
|
|
"\n" // 2 if(i != 0) -> (next byte)
|
|
: [port] "+e"(port), [byte] "+r"(b), [bit] "+r"(bit),
|
|
[next] "+r"(next), [count] "+w"(i)
|
|
: [hi] "r"(hi), [lo] "r"(lo), [ptr] "e"(ptr));
|
|
}
|
|
#endif // NEO_KHZ400
|
|
|
|
// 12 MHz(ish) AVR --------------------------------------------------------
|
|
#elif (F_CPU >= 11100000UL) && (F_CPU <= 14300000UL)
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
|
|
// In the 12 MHz case, an optimized 800 KHz datastream (no dead time
|
|
// between bytes) requires a PORT-specific loop similar to the 8 MHz
|
|
// code (but a little more relaxed in this case).
|
|
|
|
// 15 instruction clocks per bit: HHHHxxxxxxLLLLL
|
|
// OUT instructions: ^ ^ ^ (T=0,4,10)
|
|
|
|
volatile uint8_t next;
|
|
|
|
// PORTD OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTD)
|
|
#if defined(PORTB) || defined(PORTC) || defined(PORTF)
|
|
if (port == &PORTD) {
|
|
#endif // defined(PORTB/C/F)
|
|
|
|
hi = PORTD | pinMask;
|
|
lo = PORTD & ~pinMask;
|
|
next = lo;
|
|
if (b & 0x80)
|
|
next = hi;
|
|
|
|
// Don't "optimize" the OUT calls into the bitTime subroutine;
|
|
// we're exploiting the RCALL and RET as 3- and 4-cycle NOPs!
|
|
asm volatile("headD:"
|
|
"\n\t" // (T = 0)
|
|
"out %[port], %[hi]"
|
|
"\n\t" // (T = 1)
|
|
"rcall bitTimeD"
|
|
"\n\t" // Bit 7 (T = 15)
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeD"
|
|
"\n\t" // Bit 6
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeD"
|
|
"\n\t" // Bit 5
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeD"
|
|
"\n\t" // Bit 4
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeD"
|
|
"\n\t" // Bit 3
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeD"
|
|
"\n\t" // Bit 2
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeD"
|
|
"\n\t" // Bit 1
|
|
// Bit 0:
|
|
"out %[port] , %[hi]"
|
|
"\n\t" // 1 PORT = hi (T = 1)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 3)
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t" // 2 b = *ptr++ (T = 5)
|
|
"out %[port] , %[next]"
|
|
"\n\t" // 1 PORT = next (T = 6)
|
|
"mov %[next] , %[lo]"
|
|
"\n\t" // 1 next = lo (T = 7)
|
|
"sbrc %[byte] , 7"
|
|
"\n\t" // 1-2 if(b & 0x80) (T = 8)
|
|
"mov %[next] , %[hi]"
|
|
"\n\t" // 0-1 next = hi (T = 9)
|
|
"nop"
|
|
"\n\t" // 1 (T = 10)
|
|
"out %[port] , %[lo]"
|
|
"\n\t" // 1 PORT = lo (T = 11)
|
|
"sbiw %[count], 1"
|
|
"\n\t" // 2 i-- (T = 13)
|
|
"brne headD"
|
|
"\n\t" // 2 if(i != 0) -> (next byte)
|
|
"rjmp doneD"
|
|
"\n\t"
|
|
"bitTimeD:"
|
|
"\n\t" // nop nop nop (T = 4)
|
|
"out %[port], %[next]"
|
|
"\n\t" // 1 PORT = next (T = 5)
|
|
"mov %[next], %[lo]"
|
|
"\n\t" // 1 next = lo (T = 6)
|
|
"rol %[byte]"
|
|
"\n\t" // 1 b <<= 1 (T = 7)
|
|
"sbrc %[byte], 7"
|
|
"\n\t" // 1-2 if(b & 0x80) (T = 8)
|
|
"mov %[next], %[hi]"
|
|
"\n\t" // 0-1 next = hi (T = 9)
|
|
"nop"
|
|
"\n\t" // 1 (T = 10)
|
|
"out %[port], %[lo]"
|
|
"\n\t" // 1 PORT = lo (T = 11)
|
|
"ret"
|
|
"\n\t" // 4 nop nop nop nop (T = 15)
|
|
"doneD:"
|
|
"\n"
|
|
: [byte] "+r"(b), [next] "+r"(next), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTD)), [ptr] "e"(ptr),
|
|
[hi] "r"(hi), [lo] "r"(lo));
|
|
|
|
#if defined(PORTB) || defined(PORTC) || defined(PORTF)
|
|
} else // other PORT(s)
|
|
#endif // defined(PORTB/C/F)
|
|
#endif // defined(PORTD)
|
|
|
|
// PORTB OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTB)
|
|
#if defined(PORTD) || defined(PORTC) || defined(PORTF)
|
|
if (port == &PORTB) {
|
|
#endif // defined(PORTD/C/F)
|
|
|
|
hi = PORTB | pinMask;
|
|
lo = PORTB & ~pinMask;
|
|
next = lo;
|
|
if (b & 0x80)
|
|
next = hi;
|
|
|
|
// Same as above, just set for PORTB & stripped of comments
|
|
asm volatile("headB:"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeB"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeB"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeB"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeB"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeB"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeB"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeB"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t"
|
|
"out %[port] , %[next]"
|
|
"\n\t"
|
|
"mov %[next] , %[lo]"
|
|
"\n\t"
|
|
"sbrc %[byte] , 7"
|
|
"\n\t"
|
|
"mov %[next] , %[hi]"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"sbiw %[count], 1"
|
|
"\n\t"
|
|
"brne headB"
|
|
"\n\t"
|
|
"rjmp doneB"
|
|
"\n\t"
|
|
"bitTimeB:"
|
|
"\n\t"
|
|
"out %[port], %[next]"
|
|
"\n\t"
|
|
"mov %[next], %[lo]"
|
|
"\n\t"
|
|
"rol %[byte]"
|
|
"\n\t"
|
|
"sbrc %[byte], 7"
|
|
"\n\t"
|
|
"mov %[next], %[hi]"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"out %[port], %[lo]"
|
|
"\n\t"
|
|
"ret"
|
|
"\n\t"
|
|
"doneB:"
|
|
"\n"
|
|
: [byte] "+r"(b), [next] "+r"(next), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTB)), [ptr] "e"(ptr),
|
|
[hi] "r"(hi), [lo] "r"(lo));
|
|
|
|
#if defined(PORTD) || defined(PORTC) || defined(PORTF)
|
|
}
|
|
#endif
|
|
#if defined(PORTC) || defined(PORTF)
|
|
else
|
|
#endif // defined(PORTC/F)
|
|
#endif // defined(PORTB)
|
|
|
|
// PORTC OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTC)
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTF)
|
|
if (port == &PORTC) {
|
|
#endif // defined(PORTD/B/F)
|
|
|
|
hi = PORTC | pinMask;
|
|
lo = PORTC & ~pinMask;
|
|
next = lo;
|
|
if (b & 0x80)
|
|
next = hi;
|
|
|
|
// Same as above, just set for PORTC & stripped of comments
|
|
asm volatile("headC:"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t"
|
|
"out %[port] , %[next]"
|
|
"\n\t"
|
|
"mov %[next] , %[lo]"
|
|
"\n\t"
|
|
"sbrc %[byte] , 7"
|
|
"\n\t"
|
|
"mov %[next] , %[hi]"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"sbiw %[count], 1"
|
|
"\n\t"
|
|
"brne headC"
|
|
"\n\t"
|
|
"rjmp doneC"
|
|
"\n\t"
|
|
"bitTimeC:"
|
|
"\n\t"
|
|
"out %[port], %[next]"
|
|
"\n\t"
|
|
"mov %[next], %[lo]"
|
|
"\n\t"
|
|
"rol %[byte]"
|
|
"\n\t"
|
|
"sbrc %[byte], 7"
|
|
"\n\t"
|
|
"mov %[next], %[hi]"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"out %[port], %[lo]"
|
|
"\n\t"
|
|
"ret"
|
|
"\n\t"
|
|
"doneC:"
|
|
"\n"
|
|
: [byte] "+r"(b), [next] "+r"(next), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTC)), [ptr] "e"(ptr),
|
|
[hi] "r"(hi), [lo] "r"(lo));
|
|
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTF)
|
|
}
|
|
#endif // defined(PORTD/B/F)
|
|
#if defined(PORTF)
|
|
else
|
|
#endif
|
|
#endif // defined(PORTC)
|
|
|
|
// PORTF OUTPUT ----------------------------------------------------
|
|
|
|
#if defined(PORTF)
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTC)
|
|
if (port == &PORTF) {
|
|
#endif // defined(PORTD/B/C)
|
|
|
|
hi = PORTF | pinMask;
|
|
lo = PORTF & ~pinMask;
|
|
next = lo;
|
|
if (b & 0x80)
|
|
next = hi;
|
|
|
|
// Same as above, just set for PORTF & stripped of comments
|
|
asm volatile("headF:"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port], %[hi]"
|
|
"\n\t"
|
|
"rcall bitTimeC"
|
|
"\n\t"
|
|
"out %[port] , %[hi]"
|
|
"\n\t"
|
|
"rjmp .+0"
|
|
"\n\t"
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t"
|
|
"out %[port] , %[next]"
|
|
"\n\t"
|
|
"mov %[next] , %[lo]"
|
|
"\n\t"
|
|
"sbrc %[byte] , 7"
|
|
"\n\t"
|
|
"mov %[next] , %[hi]"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"out %[port] , %[lo]"
|
|
"\n\t"
|
|
"sbiw %[count], 1"
|
|
"\n\t"
|
|
"brne headF"
|
|
"\n\t"
|
|
"rjmp doneC"
|
|
"\n\t"
|
|
"bitTimeC:"
|
|
"\n\t"
|
|
"out %[port], %[next]"
|
|
"\n\t"
|
|
"mov %[next], %[lo]"
|
|
"\n\t"
|
|
"rol %[byte]"
|
|
"\n\t"
|
|
"sbrc %[byte], 7"
|
|
"\n\t"
|
|
"mov %[next], %[hi]"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"out %[port], %[lo]"
|
|
"\n\t"
|
|
"ret"
|
|
"\n\t"
|
|
"doneC:"
|
|
"\n"
|
|
: [byte] "+r"(b), [next] "+r"(next), [count] "+w"(i)
|
|
: [port] "I"(_SFR_IO_ADDR(PORTF)), [ptr] "e"(ptr),
|
|
[hi] "r"(hi), [lo] "r"(lo));
|
|
|
|
#if defined(PORTD) || defined(PORTB) || defined(PORTC)
|
|
}
|
|
#endif // defined(PORTD/B/C)
|
|
#endif // defined(PORTF)
|
|
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 KHz
|
|
|
|
// 30 instruction clocks per bit: HHHHHHxxxxxxxxxLLLLLLLLLLLLLLL
|
|
// ST instructions: ^ ^ ^ (T=0,6,15)
|
|
|
|
volatile uint8_t next, bit;
|
|
|
|
hi = *port | pinMask;
|
|
lo = *port & ~pinMask;
|
|
next = lo;
|
|
bit = 8;
|
|
|
|
asm volatile("head30:"
|
|
"\n\t" // Clk Pseudocode (T = 0)
|
|
"st %a[port], %[hi]"
|
|
"\n\t" // 2 PORT = hi (T = 2)
|
|
"sbrc %[byte] , 7"
|
|
"\n\t" // 1-2 if(b & 128)
|
|
"mov %[next], %[hi]"
|
|
"\n\t" // 0-1 next = hi (T = 4)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 6)
|
|
"st %a[port], %[next]"
|
|
"\n\t" // 2 PORT = next (T = 8)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 10)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 12)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 14)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 15)
|
|
"st %a[port], %[lo]"
|
|
"\n\t" // 2 PORT = lo (T = 17)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 19)
|
|
"dec %[bit]"
|
|
"\n\t" // 1 bit-- (T = 20)
|
|
"breq nextbyte30"
|
|
"\n\t" // 1-2 if(bit == 0)
|
|
"rol %[byte]"
|
|
"\n\t" // 1 b <<= 1 (T = 22)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 24)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 26)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 28)
|
|
"rjmp head30"
|
|
"\n\t" // 2 -> head30 (next bit out)
|
|
"nextbyte30:"
|
|
"\n\t" // (T = 22)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 23)
|
|
"ldi %[bit] , 8"
|
|
"\n\t" // 1 bit = 8 (T = 24)
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t" // 2 b = *ptr++ (T = 26)
|
|
"sbiw %[count], 1"
|
|
"\n\t" // 2 i-- (T = 28)
|
|
"brne head30"
|
|
"\n" // 1-2 if(i != 0) -> (next byte)
|
|
: [port] "+e"(port), [byte] "+r"(b), [bit] "+r"(bit),
|
|
[next] "+r"(next), [count] "+w"(i)
|
|
: [hi] "r"(hi), [lo] "r"(lo), [ptr] "e"(ptr));
|
|
}
|
|
#endif // NEO_KHZ400
|
|
|
|
// 16 MHz(ish) AVR --------------------------------------------------------
|
|
#elif (F_CPU >= 15400000UL) && (F_CPU <= 19000000L)
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
|
|
// WS2811 and WS2812 have different hi/lo duty cycles; this is
|
|
// similar but NOT an exact copy of the prior 400-on-8 code.
|
|
|
|
// 20 inst. clocks per bit: HHHHHxxxxxxxxLLLLLLL
|
|
// ST instructions: ^ ^ ^ (T=0,5,13)
|
|
|
|
volatile uint8_t next, bit;
|
|
|
|
hi = *port | pinMask;
|
|
lo = *port & ~pinMask;
|
|
next = lo;
|
|
bit = 8;
|
|
|
|
asm volatile("head20:"
|
|
"\n\t" // Clk Pseudocode (T = 0)
|
|
"st %a[port], %[hi]"
|
|
"\n\t" // 2 PORT = hi (T = 2)
|
|
"sbrc %[byte], 7"
|
|
"\n\t" // 1-2 if(b & 128)
|
|
"mov %[next], %[hi]"
|
|
"\n\t" // 0-1 next = hi (T = 4)
|
|
"dec %[bit]"
|
|
"\n\t" // 1 bit-- (T = 5)
|
|
"st %a[port], %[next]"
|
|
"\n\t" // 2 PORT = next (T = 7)
|
|
"mov %[next] , %[lo]"
|
|
"\n\t" // 1 next = lo (T = 8)
|
|
"breq nextbyte20"
|
|
"\n\t" // 1-2 if(bit == 0) (from dec above)
|
|
"rol %[byte]"
|
|
"\n\t" // 1 b <<= 1 (T = 10)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 12)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 13)
|
|
"st %a[port], %[lo]"
|
|
"\n\t" // 2 PORT = lo (T = 15)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 16)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 18)
|
|
"rjmp head20"
|
|
"\n\t" // 2 -> head20 (next bit out)
|
|
"nextbyte20:"
|
|
"\n\t" // (T = 10)
|
|
"ldi %[bit] , 8"
|
|
"\n\t" // 1 bit = 8 (T = 11)
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t" // 2 b = *ptr++ (T = 13)
|
|
"st %a[port], %[lo]"
|
|
"\n\t" // 2 PORT = lo (T = 15)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 16)
|
|
"sbiw %[count], 1"
|
|
"\n\t" // 2 i-- (T = 18)
|
|
"brne head20"
|
|
"\n" // 2 if(i != 0) -> (next byte)
|
|
: [port] "+e"(port), [byte] "+r"(b), [bit] "+r"(bit),
|
|
[next] "+r"(next), [count] "+w"(i)
|
|
: [ptr] "e"(ptr), [hi] "r"(hi), [lo] "r"(lo));
|
|
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 KHz
|
|
|
|
// The 400 KHz clock on 16 MHz MCU is the most 'relaxed' version.
|
|
|
|
// 40 inst. clocks per bit: HHHHHHHHxxxxxxxxxxxxLLLLLLLLLLLLLLLLLLLL
|
|
// ST instructions: ^ ^ ^ (T=0,8,20)
|
|
|
|
volatile uint8_t next, bit;
|
|
|
|
hi = *port | pinMask;
|
|
lo = *port & ~pinMask;
|
|
next = lo;
|
|
bit = 8;
|
|
|
|
asm volatile("head40:"
|
|
"\n\t" // Clk Pseudocode (T = 0)
|
|
"st %a[port], %[hi]"
|
|
"\n\t" // 2 PORT = hi (T = 2)
|
|
"sbrc %[byte] , 7"
|
|
"\n\t" // 1-2 if(b & 128)
|
|
"mov %[next] , %[hi]"
|
|
"\n\t" // 0-1 next = hi (T = 4)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 6)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 8)
|
|
"st %a[port], %[next]"
|
|
"\n\t" // 2 PORT = next (T = 10)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 12)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 14)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 16)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 18)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 20)
|
|
"st %a[port], %[lo]"
|
|
"\n\t" // 2 PORT = lo (T = 22)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 23)
|
|
"mov %[next] , %[lo]"
|
|
"\n\t" // 1 next = lo (T = 24)
|
|
"dec %[bit]"
|
|
"\n\t" // 1 bit-- (T = 25)
|
|
"breq nextbyte40"
|
|
"\n\t" // 1-2 if(bit == 0)
|
|
"rol %[byte]"
|
|
"\n\t" // 1 b <<= 1 (T = 27)
|
|
"nop"
|
|
"\n\t" // 1 nop (T = 28)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 30)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 32)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 34)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 36)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 38)
|
|
"rjmp head40"
|
|
"\n\t" // 2 -> head40 (next bit out)
|
|
"nextbyte40:"
|
|
"\n\t" // (T = 27)
|
|
"ldi %[bit] , 8"
|
|
"\n\t" // 1 bit = 8 (T = 28)
|
|
"ld %[byte] , %a[ptr]+"
|
|
"\n\t" // 2 b = *ptr++ (T = 30)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 32)
|
|
"st %a[port], %[lo]"
|
|
"\n\t" // 2 PORT = lo (T = 34)
|
|
"rjmp .+0"
|
|
"\n\t" // 2 nop nop (T = 36)
|
|
"sbiw %[count], 1"
|
|
"\n\t" // 2 i-- (T = 38)
|
|
"brne head40"
|
|
"\n" // 1-2 if(i != 0) -> (next byte)
|
|
: [port] "+e"(port), [byte] "+r"(b), [bit] "+r"(bit),
|
|
[next] "+r"(next), [count] "+w"(i)
|
|
: [ptr] "e"(ptr), [hi] "r"(hi), [lo] "r"(lo));
|
|
}
|
|
#endif // NEO_KHZ400
|
|
|
|
#else
|
|
#error "CPU SPEED NOT SUPPORTED"
|
|
#endif // end F_CPU ifdefs on __AVR__
|
|
|
|
// END AVR ----------------------------------------------------------------
|
|
|
|
#elif defined(__arm__)
|
|
|
|
// ARM MCUs -- Teensy 3.0, 3.1, LC, Arduino Due, RP2040 -------------------
|
|
|
|
#if defined(ARDUINO_ARCH_RP2040)
|
|
// Use PIO
|
|
rp2040Show(pin, pixels, numBytes, is800KHz);
|
|
|
|
#elif defined(TEENSYDUINO) && \
|
|
defined(KINETISK) // Teensy 3.0, 3.1, 3.2, 3.5, 3.6
|
|
#define CYCLES_800_T0H (F_CPU / 4000000)
|
|
#define CYCLES_800_T1H (F_CPU / 1250000)
|
|
#define CYCLES_800 (F_CPU / 800000)
|
|
#define CYCLES_400_T0H (F_CPU / 2000000)
|
|
#define CYCLES_400_T1H (F_CPU / 833333)
|
|
#define CYCLES_400 (F_CPU / 400000)
|
|
|
|
uint8_t *p = pixels, *end = p + numBytes, pix, mask;
|
|
volatile uint8_t *set = portSetRegister(pin), *clr = portClearRegister(pin);
|
|
uint32_t cyc;
|
|
|
|
ARM_DEMCR |= ARM_DEMCR_TRCENA;
|
|
ARM_DWT_CTRL |= ARM_DWT_CTRL_CYCCNTENA;
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
cyc = ARM_DWT_CYCCNT + CYCLES_800;
|
|
while (p < end) {
|
|
pix = *p++;
|
|
for (mask = 0x80; mask; mask >>= 1) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800)
|
|
;
|
|
cyc = ARM_DWT_CYCCNT;
|
|
*set = 1;
|
|
if (pix & mask) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800_T1H)
|
|
;
|
|
} else {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800_T0H)
|
|
;
|
|
}
|
|
*clr = 1;
|
|
}
|
|
}
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800)
|
|
;
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 kHz bitstream
|
|
cyc = ARM_DWT_CYCCNT + CYCLES_400;
|
|
while (p < end) {
|
|
pix = *p++;
|
|
for (mask = 0x80; mask; mask >>= 1) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400)
|
|
;
|
|
cyc = ARM_DWT_CYCCNT;
|
|
*set = 1;
|
|
if (pix & mask) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400_T1H)
|
|
;
|
|
} else {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400_T0H)
|
|
;
|
|
}
|
|
*clr = 1;
|
|
}
|
|
}
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400)
|
|
;
|
|
}
|
|
#endif // NEO_KHZ400
|
|
|
|
#elif defined(TEENSYDUINO) && (defined(__IMXRT1052__) || defined(__IMXRT1062__))
|
|
#define CYCLES_800_T0H (F_CPU_ACTUAL / 4000000)
|
|
#define CYCLES_800_T1H (F_CPU_ACTUAL / 1250000)
|
|
#define CYCLES_800 (F_CPU_ACTUAL / 800000)
|
|
#define CYCLES_400_T0H (F_CPU_ACTUAL / 2000000)
|
|
#define CYCLES_400_T1H (F_CPU_ACTUAL / 833333)
|
|
#define CYCLES_400 (F_CPU_ACTUAL / 400000)
|
|
|
|
uint8_t *p = pixels, *end = p + numBytes, pix, mask;
|
|
volatile uint32_t *set = portSetRegister(pin), *clr = portClearRegister(pin);
|
|
uint32_t cyc, msk = digitalPinToBitMask(pin);
|
|
|
|
ARM_DEMCR |= ARM_DEMCR_TRCENA;
|
|
ARM_DWT_CTRL |= ARM_DWT_CTRL_CYCCNTENA;
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
cyc = ARM_DWT_CYCCNT + CYCLES_800;
|
|
while (p < end) {
|
|
pix = *p++;
|
|
for (mask = 0x80; mask; mask >>= 1) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800)
|
|
;
|
|
cyc = ARM_DWT_CYCCNT;
|
|
*set = msk;
|
|
if (pix & mask) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800_T1H)
|
|
;
|
|
} else {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800_T0H)
|
|
;
|
|
}
|
|
*clr = msk;
|
|
}
|
|
}
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800)
|
|
;
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 kHz bitstream
|
|
cyc = ARM_DWT_CYCCNT + CYCLES_400;
|
|
while (p < end) {
|
|
pix = *p++;
|
|
for (mask = 0x80; mask; mask >>= 1) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400)
|
|
;
|
|
cyc = ARM_DWT_CYCCNT;
|
|
*set = msk;
|
|
if (pix & mask) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400_T1H)
|
|
;
|
|
} else {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400_T0H)
|
|
;
|
|
}
|
|
*clr = msk;
|
|
}
|
|
}
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400)
|
|
;
|
|
}
|
|
#endif // NEO_KHZ400
|
|
|
|
#elif defined(TEENSYDUINO) && defined(__MKL26Z64__) // Teensy-LC
|
|
|
|
#if F_CPU == 48000000
|
|
uint8_t *p = pixels, pix, count, dly, bitmask = digitalPinToBitMask(pin);
|
|
volatile uint8_t *reg = portSetRegister(pin);
|
|
uint32_t num = numBytes;
|
|
asm volatile("L%=_begin:"
|
|
"\n\t"
|
|
"ldrb %[pix], [%[p], #0]"
|
|
"\n\t"
|
|
"lsl %[pix], #24"
|
|
"\n\t"
|
|
"movs %[count], #7"
|
|
"\n\t"
|
|
"L%=_loop:"
|
|
"\n\t"
|
|
"lsl %[pix], #1"
|
|
"\n\t"
|
|
"bcs L%=_loop_one"
|
|
"\n\t"
|
|
"L%=_loop_zero:"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #0]"
|
|
"\n\t"
|
|
"movs %[dly], #4"
|
|
"\n\t"
|
|
"L%=_loop_delay_T0H:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_loop_delay_T0H"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #4]"
|
|
"\n\t"
|
|
"movs %[dly], #13"
|
|
"\n\t"
|
|
"L%=_loop_delay_T0L:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_loop_delay_T0L"
|
|
"\n\t"
|
|
"b L%=_next"
|
|
"\n\t"
|
|
"L%=_loop_one:"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #0]"
|
|
"\n\t"
|
|
"movs %[dly], #13"
|
|
"\n\t"
|
|
"L%=_loop_delay_T1H:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_loop_delay_T1H"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #4]"
|
|
"\n\t"
|
|
"movs %[dly], #4"
|
|
"\n\t"
|
|
"L%=_loop_delay_T1L:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_loop_delay_T1L"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"L%=_next:"
|
|
"\n\t"
|
|
"sub %[count], #1"
|
|
"\n\t"
|
|
"bne L%=_loop"
|
|
"\n\t"
|
|
"lsl %[pix], #1"
|
|
"\n\t"
|
|
"bcs L%=_last_one"
|
|
"\n\t"
|
|
"L%=_last_zero:"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #0]"
|
|
"\n\t"
|
|
"movs %[dly], #4"
|
|
"\n\t"
|
|
"L%=_last_delay_T0H:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_last_delay_T0H"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #4]"
|
|
"\n\t"
|
|
"movs %[dly], #10"
|
|
"\n\t"
|
|
"L%=_last_delay_T0L:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_last_delay_T0L"
|
|
"\n\t"
|
|
"b L%=_repeat"
|
|
"\n\t"
|
|
"L%=_last_one:"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #0]"
|
|
"\n\t"
|
|
"movs %[dly], #13"
|
|
"\n\t"
|
|
"L%=_last_delay_T1H:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_last_delay_T1H"
|
|
"\n\t"
|
|
"strb %[bitmask], [%[reg], #4]"
|
|
"\n\t"
|
|
"movs %[dly], #1"
|
|
"\n\t"
|
|
"L%=_last_delay_T1L:"
|
|
"\n\t"
|
|
"sub %[dly], #1"
|
|
"\n\t"
|
|
"bne L%=_last_delay_T1L"
|
|
"\n\t"
|
|
"nop"
|
|
"\n\t"
|
|
"L%=_repeat:"
|
|
"\n\t"
|
|
"add %[p], #1"
|
|
"\n\t"
|
|
"sub %[num], #1"
|
|
"\n\t"
|
|
"bne L%=_begin"
|
|
"\n\t"
|
|
"L%=_done:"
|
|
"\n\t"
|
|
: [p] "+r"(p), [pix] "=&r"(pix), [count] "=&r"(count),
|
|
[dly] "=&r"(dly), [num] "+r"(num)
|
|
: [bitmask] "r"(bitmask), [reg] "r"(reg));
|
|
#else
|
|
#error "Sorry, only 48 MHz is supported, please set Tools > CPU Speed to 48 MHz"
|
|
#endif // F_CPU == 48000000
|
|
|
|
// Begin of support for nRF52 based boards -------------------------
|
|
|
|
#elif defined(NRF52) || defined(NRF52_SERIES)
|
|
// [[[Begin of the Neopixel NRF52 EasyDMA implementation
|
|
// by the Hackerspace San Salvador]]]
|
|
// This technique uses the PWM peripheral on the NRF52. The PWM uses the
|
|
// EasyDMA feature included on the chip. This technique loads the duty
|
|
// cycle configuration for each cycle when the PWM is enabled. For this
|
|
// to work we need to store a 16 bit configuration for each bit of the
|
|
// RGB(W) values in the pixel buffer.
|
|
// Comparator values for the PWM were hand picked and are guaranteed to
|
|
// be 100% organic to preserve freshness and high accuracy. Current
|
|
// parameters are:
|
|
// * PWM Clock: 16Mhz
|
|
// * Minimum step time: 62.5ns
|
|
// * Time for zero in high (T0H): 0.31ms
|
|
// * Time for one in high (T1H): 0.75ms
|
|
// * Cycle time: 1.25us
|
|
// * Frequency: 800Khz
|
|
// For 400Khz we just double the calculated times.
|
|
// ---------- BEGIN Constants for the EasyDMA implementation -----------
|
|
// The PWM starts the duty cycle in LOW. To start with HIGH we
|
|
// need to set the 15th bit on each register.
|
|
|
|
// WS2812 (rev A) timing is 0.35 and 0.7us
|
|
//#define MAGIC_T0H 5UL | (0x8000) // 0.3125us
|
|
//#define MAGIC_T1H 12UL | (0x8000) // 0.75us
|
|
|
|
// WS2812B (rev B) timing is 0.4 and 0.8 us
|
|
#define MAGIC_T0H 6UL | (0x8000) // 0.375us
|
|
#define MAGIC_T1H 13UL | (0x8000) // 0.8125us
|
|
|
|
// WS2811 (400 khz) timing is 0.5 and 1.2
|
|
#define MAGIC_T0H_400KHz 8UL | (0x8000) // 0.5us
|
|
#define MAGIC_T1H_400KHz 19UL | (0x8000) // 1.1875us
|
|
|
|
// For 400Khz, we double value of CTOPVAL
|
|
#define CTOPVAL 20UL // 1.25us
|
|
#define CTOPVAL_400KHz 40UL // 2.5us
|
|
|
|
// ---------- END Constants for the EasyDMA implementation -------------
|
|
//
|
|
// If there is no device available an alternative cycle-counter
|
|
// implementation is tried.
|
|
// The nRF52 runs with a fixed clock of 64Mhz. The alternative
|
|
// implementation is the same as the one used for the Teensy 3.0/1/2 but
|
|
// with the Nordic SDK HAL & registers syntax.
|
|
// The number of cycles was hand picked and is guaranteed to be 100%
|
|
// organic to preserve freshness and high accuracy.
|
|
// ---------- BEGIN Constants for cycle counter implementation ---------
|
|
#define CYCLES_800_T0H 18 // ~0.36 uS
|
|
#define CYCLES_800_T1H 41 // ~0.76 uS
|
|
#define CYCLES_800 71 // ~1.25 uS
|
|
|
|
#define CYCLES_400_T0H 26 // ~0.50 uS
|
|
#define CYCLES_400_T1H 70 // ~1.26 uS
|
|
#define CYCLES_400 156 // ~2.50 uS
|
|
// ---------- END of Constants for cycle counter implementation --------
|
|
|
|
// To support both the SoftDevice + Neopixels we use the EasyDMA
|
|
// feature from the NRF25. However this technique implies to
|
|
// generate a pattern and store it on the memory. The actual
|
|
// memory used in bytes corresponds to the following formula:
|
|
// totalMem = numBytes*8*2+(2*2)
|
|
// The two additional bytes at the end are needed to reset the
|
|
// sequence.
|
|
//
|
|
// If there is not enough memory, we will fall back to cycle counter
|
|
// using DWT
|
|
uint32_t pattern_size =
|
|
numBytes * 8 * sizeof(uint16_t) + 2 * sizeof(uint16_t);
|
|
uint16_t *pixels_pattern = NULL;
|
|
|
|
NRF_PWM_Type *pwm = NULL;
|
|
|
|
// Try to find a free PWM device, which is not enabled
|
|
// and has no connected pins
|
|
NRF_PWM_Type *PWM[] = {
|
|
NRF_PWM0,
|
|
NRF_PWM1,
|
|
NRF_PWM2
|
|
#if defined(NRF_PWM3)
|
|
,
|
|
NRF_PWM3
|
|
#endif
|
|
};
|
|
|
|
for (unsigned int device = 0; device < (sizeof(PWM) / sizeof(PWM[0]));
|
|
device++) {
|
|
if ((PWM[device]->ENABLE == 0) &&
|
|
(PWM[device]->PSEL.OUT[0] & PWM_PSEL_OUT_CONNECT_Msk) &&
|
|
(PWM[device]->PSEL.OUT[1] & PWM_PSEL_OUT_CONNECT_Msk) &&
|
|
(PWM[device]->PSEL.OUT[2] & PWM_PSEL_OUT_CONNECT_Msk) &&
|
|
(PWM[device]->PSEL.OUT[3] & PWM_PSEL_OUT_CONNECT_Msk)) {
|
|
pwm = PWM[device];
|
|
break;
|
|
}
|
|
}
|
|
|
|
// only malloc if there is PWM device available
|
|
if (pwm != NULL) {
|
|
#if defined(ARDUINO_NRF52_ADAFRUIT) // use thread-safe malloc
|
|
pixels_pattern = (uint16_t *)rtos_malloc(pattern_size);
|
|
#else
|
|
pixels_pattern = (uint16_t *)malloc(pattern_size);
|
|
#endif
|
|
}
|
|
|
|
// Use the identified device to choose the implementation
|
|
// If a PWM device is available use DMA
|
|
if ((pixels_pattern != NULL) && (pwm != NULL)) {
|
|
uint16_t pos = 0; // bit position
|
|
|
|
for (uint16_t n = 0; n < numBytes; n++) {
|
|
uint8_t pix = pixels[n];
|
|
|
|
for (uint8_t mask = 0x80; mask > 0; mask >>= 1) {
|
|
#if defined(NEO_KHZ400)
|
|
if (!is800KHz) {
|
|
pixels_pattern[pos] =
|
|
(pix & mask) ? MAGIC_T1H_400KHz : MAGIC_T0H_400KHz;
|
|
} else
|
|
#endif
|
|
{
|
|
pixels_pattern[pos] = (pix & mask) ? MAGIC_T1H : MAGIC_T0H;
|
|
}
|
|
|
|
pos++;
|
|
}
|
|
}
|
|
|
|
// Zero padding to indicate the end of que sequence
|
|
pixels_pattern[pos++] = 0 | (0x8000); // Seq end
|
|
pixels_pattern[pos++] = 0 | (0x8000); // Seq end
|
|
|
|
// Set the wave mode to count UP
|
|
pwm->MODE = (PWM_MODE_UPDOWN_Up << PWM_MODE_UPDOWN_Pos);
|
|
|
|
// Set the PWM to use the 16MHz clock
|
|
pwm->PRESCALER =
|
|
(PWM_PRESCALER_PRESCALER_DIV_1 << PWM_PRESCALER_PRESCALER_Pos);
|
|
|
|
// Setting of the maximum count
|
|
// but keeping it on 16Mhz allows for more granularity just
|
|
// in case someone wants to do more fine-tuning of the timing.
|
|
#if defined(NEO_KHZ400)
|
|
if (!is800KHz) {
|
|
pwm->COUNTERTOP = (CTOPVAL_400KHz << PWM_COUNTERTOP_COUNTERTOP_Pos);
|
|
} else
|
|
#endif
|
|
{
|
|
pwm->COUNTERTOP = (CTOPVAL << PWM_COUNTERTOP_COUNTERTOP_Pos);
|
|
}
|
|
|
|
// Disable loops, we want the sequence to repeat only once
|
|
pwm->LOOP = (PWM_LOOP_CNT_Disabled << PWM_LOOP_CNT_Pos);
|
|
|
|
// On the "Common" setting the PWM uses the same pattern for the
|
|
// for supported sequences. The pattern is stored on half-word
|
|
// of 16bits
|
|
pwm->DECODER = (PWM_DECODER_LOAD_Common << PWM_DECODER_LOAD_Pos) |
|
|
(PWM_DECODER_MODE_RefreshCount << PWM_DECODER_MODE_Pos);
|
|
|
|
// Pointer to the memory storing the patter
|
|
pwm->SEQ[0].PTR = (uint32_t)(pixels_pattern) << PWM_SEQ_PTR_PTR_Pos;
|
|
|
|
// Calculation of the number of steps loaded from memory.
|
|
pwm->SEQ[0].CNT = (pattern_size / sizeof(uint16_t)) << PWM_SEQ_CNT_CNT_Pos;
|
|
|
|
// The following settings are ignored with the current config.
|
|
pwm->SEQ[0].REFRESH = 0;
|
|
pwm->SEQ[0].ENDDELAY = 0;
|
|
|
|
// The Neopixel implementation is a blocking algorithm. DMA
|
|
// allows for non-blocking operation. To "simulate" a blocking
|
|
// operation we enable the interruption for the end of sequence
|
|
// and block the execution thread until the event flag is set by
|
|
// the peripheral.
|
|
// pwm->INTEN |= (PWM_INTEN_SEQEND0_Enabled<<PWM_INTEN_SEQEND0_Pos);
|
|
|
|
// PSEL must be configured before enabling PWM
|
|
#if defined(ARDUINO_ARCH_NRF52840)
|
|
pwm->PSEL.OUT[0] = g_APinDescription[pin].name;
|
|
#else
|
|
pwm->PSEL.OUT[0] = g_ADigitalPinMap[pin];
|
|
#endif
|
|
|
|
// Enable the PWM
|
|
pwm->ENABLE = 1;
|
|
|
|
// After all of this and many hours of reading the documentation
|
|
// we are ready to start the sequence...
|
|
pwm->EVENTS_SEQEND[0] = 0;
|
|
pwm->TASKS_SEQSTART[0] = 1;
|
|
|
|
// But we have to wait for the flag to be set.
|
|
while (!pwm->EVENTS_SEQEND[0]) {
|
|
#if defined(ARDUINO_NRF52_ADAFRUIT) || defined(ARDUINO_ARCH_NRF52840)
|
|
yield();
|
|
#endif
|
|
}
|
|
|
|
// Before leave we clear the flag for the event.
|
|
pwm->EVENTS_SEQEND[0] = 0;
|
|
|
|
// We need to disable the device and disconnect
|
|
// all the outputs before leave or the device will not
|
|
// be selected on the next call.
|
|
// TODO: Check if disabling the device causes performance issues.
|
|
pwm->ENABLE = 0;
|
|
|
|
pwm->PSEL.OUT[0] = 0xFFFFFFFFUL;
|
|
|
|
#if defined(ARDUINO_NRF52_ADAFRUIT) // use thread-safe free
|
|
rtos_free(pixels_pattern);
|
|
#else
|
|
free(pixels_pattern);
|
|
#endif
|
|
} // End of DMA implementation
|
|
// ---------------------------------------------------------------------
|
|
else {
|
|
#ifndef ARDUINO_ARCH_NRF52840
|
|
// Fall back to DWT
|
|
#if defined(ARDUINO_NRF52_ADAFRUIT)
|
|
// Bluefruit Feather 52 uses freeRTOS
|
|
// Critical Section is used since it does not block SoftDevice execution
|
|
taskENTER_CRITICAL();
|
|
#elif defined(NRF52_DISABLE_INT)
|
|
// If you are using the Bluetooth SoftDevice we advise you to not disable
|
|
// the interrupts. Disabling the interrupts even for short periods of time
|
|
// causes the SoftDevice to stop working.
|
|
// Disable the interrupts only in cases where you need high performance for
|
|
// the LEDs and if you are not using the EasyDMA feature.
|
|
__disable_irq();
|
|
#endif
|
|
|
|
NRF_GPIO_Type *nrf_port = (NRF_GPIO_Type *)digitalPinToPort(pin);
|
|
uint32_t pinMask = digitalPinToBitMask(pin);
|
|
|
|
uint32_t CYCLES_X00 = CYCLES_800;
|
|
uint32_t CYCLES_X00_T1H = CYCLES_800_T1H;
|
|
uint32_t CYCLES_X00_T0H = CYCLES_800_T0H;
|
|
|
|
#if defined(NEO_KHZ400)
|
|
if (!is800KHz) {
|
|
CYCLES_X00 = CYCLES_400;
|
|
CYCLES_X00_T1H = CYCLES_400_T1H;
|
|
CYCLES_X00_T0H = CYCLES_400_T0H;
|
|
}
|
|
#endif
|
|
|
|
// Enable DWT in debug core
|
|
CoreDebug->DEMCR |= CoreDebug_DEMCR_TRCENA_Msk;
|
|
DWT->CTRL |= DWT_CTRL_CYCCNTENA_Msk;
|
|
|
|
// Tries to re-send the frame if is interrupted by the SoftDevice.
|
|
while (1) {
|
|
uint8_t *p = pixels;
|
|
|
|
uint32_t cycStart = DWT->CYCCNT;
|
|
uint32_t cyc = 0;
|
|
|
|
for (uint16_t n = 0; n < numBytes; n++) {
|
|
uint8_t pix = *p++;
|
|
|
|
for (uint8_t mask = 0x80; mask; mask >>= 1) {
|
|
while (DWT->CYCCNT - cyc < CYCLES_X00)
|
|
;
|
|
cyc = DWT->CYCCNT;
|
|
|
|
nrf_port->OUTSET |= pinMask;
|
|
|
|
if (pix & mask) {
|
|
while (DWT->CYCCNT - cyc < CYCLES_X00_T1H)
|
|
;
|
|
} else {
|
|
while (DWT->CYCCNT - cyc < CYCLES_X00_T0H)
|
|
;
|
|
}
|
|
|
|
nrf_port->OUTCLR |= pinMask;
|
|
}
|
|
}
|
|
while (DWT->CYCCNT - cyc < CYCLES_X00)
|
|
;
|
|
|
|
// If total time longer than 25%, resend the whole data.
|
|
// Since we are likely to be interrupted by SoftDevice
|
|
if ((DWT->CYCCNT - cycStart) < (8 * numBytes * ((CYCLES_X00 * 5) / 4))) {
|
|
break;
|
|
}
|
|
|
|
// re-send need 300us delay
|
|
delayMicroseconds(300);
|
|
}
|
|
|
|
// Enable interrupts again
|
|
#if defined(ARDUINO_NRF52_ADAFRUIT)
|
|
taskEXIT_CRITICAL();
|
|
#elif defined(NRF52_DISABLE_INT)
|
|
__enable_irq();
|
|
#endif
|
|
#endif
|
|
}
|
|
// END of NRF52 implementation
|
|
|
|
#elif defined(__SAMD21E17A__) || defined(__SAMD21G18A__) || \
|
|
defined(__SAMD21E18A__) || defined(__SAMD21J18A__) || \
|
|
defined(__SAMD11C14A__) || defined(__SAMD21G17A__)
|
|
// Arduino Zero, Gemma/Trinket M0, SODAQ Autonomo
|
|
// and others
|
|
// Tried this with a timer/counter, couldn't quite get adequate
|
|
// resolution. So yay, you get a load of goofball NOPs...
|
|
|
|
uint8_t *ptr, *end, p, bitMask, portNum;
|
|
uint32_t pinMask;
|
|
|
|
portNum = g_APinDescription[pin].ulPort;
|
|
pinMask = 1ul << g_APinDescription[pin].ulPin;
|
|
ptr = pixels;
|
|
end = ptr + numBytes;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
|
|
volatile uint32_t *set = &(PORT->Group[portNum].OUTSET.reg),
|
|
*clr = &(PORT->Group[portNum].OUTCLR.reg);
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
for (;;) {
|
|
*set = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
if (p & bitMask) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop;");
|
|
*clr = pinMask;
|
|
} else {
|
|
*clr = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop;");
|
|
}
|
|
if (bitMask >>= 1) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
} else {
|
|
if (ptr >= end)
|
|
break;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 KHz bitstream
|
|
for (;;) {
|
|
*set = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
if (p & bitMask) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop;");
|
|
*clr = pinMask;
|
|
} else {
|
|
*clr = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop;");
|
|
}
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
if (bitMask >>= 1) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop;");
|
|
} else {
|
|
if (ptr >= end)
|
|
break;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
}
|
|
#endif
|
|
|
|
//----
|
|
#elif defined(XMC1100_XMC2GO) || defined(XMC1100_H_BRIDGE2GO) || defined(XMC1100_Boot_Kit) || defined(XMC1300_Boot_Kit)
|
|
|
|
// XMC1100/1200/1300 with ARM Cortex M0 are running with 32MHz, XMC1400 runs with 48MHz so may not work
|
|
// Tried this with a timer/counter, couldn't quite get adequate
|
|
// resolution. So yay, you get a load of goofball NOPs...
|
|
|
|
uint8_t *ptr, *end, p, bitMask, portNum;
|
|
uint32_t pinMask;
|
|
|
|
ptr = pixels;
|
|
end = ptr + numBytes;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
|
|
XMC_GPIO_PORT_t* XMC_port = mapping_port_pin[ pin ].port;
|
|
uint8_t XMC_pin = mapping_port_pin[ pin ].pin;
|
|
|
|
uint32_t omrhigh = (uint32_t)XMC_GPIO_OUTPUT_LEVEL_HIGH << XMC_pin;
|
|
uint32_t omrlow = (uint32_t)XMC_GPIO_OUTPUT_LEVEL_LOW << XMC_pin;
|
|
|
|
#ifdef NEO_KHZ400 // 800 KHz check needed only if 400 KHz support enabled
|
|
if(is800KHz) {
|
|
#endif
|
|
for(;;) {
|
|
XMC_port->OMR = omrhigh;
|
|
asm("nop; nop; nop; nop;");
|
|
if(p & bitMask) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop;");
|
|
XMC_port->OMR = omrlow;
|
|
} else {
|
|
XMC_port->OMR = omrlow;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop;");
|
|
}
|
|
if(bitMask >>= 1) {
|
|
asm("nop; nop; nop; nop; nop;");
|
|
} else {
|
|
if(ptr >= end) break;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
#ifdef NEO_KHZ400 // untested code
|
|
} else { // 400 KHz bitstream
|
|
for(;;) {
|
|
XMC_port->OMR = omrhigh;
|
|
asm("nop; nop; nop; nop; nop;");
|
|
if(p & bitMask) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop;");
|
|
XMC_port->OMR = omrlow;
|
|
} else {
|
|
XMC_port->OMR = omrlow;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop;");
|
|
}
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
if(bitMask >>= 1) {
|
|
asm("nop; nop; nop;");
|
|
} else {
|
|
if(ptr >= end) break;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
}
|
|
|
|
#endif
|
|
//----
|
|
|
|
//----
|
|
#elif defined(XMC4700_Relax_Kit) || defined(XMC4800_Relax_Kit)
|
|
|
|
// XMC4700 and XMC4800 with ARM Cortex M4 are running with 144MHz
|
|
// Tried this with a timer/counter, couldn't quite get adequate
|
|
// resolution. So yay, you get a load of goofball NOPs...
|
|
|
|
uint8_t *ptr, *end, p, bitMask, portNum;
|
|
uint32_t pinMask;
|
|
|
|
ptr = pixels;
|
|
end = ptr + numBytes;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
|
|
XMC_GPIO_PORT_t* XMC_port = mapping_port_pin[ pin ].port;
|
|
uint8_t XMC_pin = mapping_port_pin[ pin ].pin;
|
|
|
|
uint32_t omrhigh = (uint32_t)XMC_GPIO_OUTPUT_LEVEL_HIGH << XMC_pin;
|
|
uint32_t omrlow = (uint32_t)XMC_GPIO_OUTPUT_LEVEL_LOW << XMC_pin;
|
|
|
|
#ifdef NEO_KHZ400 // 800 KHz check needed only if 400 KHz support enabled
|
|
if(is800KHz) {
|
|
#endif
|
|
|
|
for(;;) {
|
|
XMC_port->OMR = omrhigh;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop;");
|
|
if(p & bitMask) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
XMC_port->OMR = omrlow;
|
|
} else {
|
|
XMC_port->OMR = omrlow;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
}
|
|
if(bitMask >>= 1) {
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;");
|
|
} else {
|
|
if(ptr >= end) break;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
|
|
|
|
#ifdef NEO_KHZ400
|
|
} else { // 400 KHz bitstream
|
|
// ToDo!
|
|
}
|
|
#endif
|
|
//----
|
|
|
|
#elif defined(__SAMD51__) // M4
|
|
|
|
uint8_t *ptr, *end, p, bitMask, portNum, bit;
|
|
uint32_t pinMask;
|
|
|
|
portNum = g_APinDescription[pin].ulPort;
|
|
pinMask = 1ul << g_APinDescription[pin].ulPin;
|
|
ptr = pixels;
|
|
end = ptr + numBytes;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
|
|
volatile uint32_t *set = &(PORT->Group[portNum].OUTSET.reg),
|
|
*clr = &(PORT->Group[portNum].OUTCLR.reg);
|
|
|
|
// SAMD51 overclock-compatible timing is only a mild abomination.
|
|
// It uses SysTick for a consistent clock reference regardless of
|
|
// optimization / cache settings. That's the good news. The bad news,
|
|
// since SysTick->VAL is a volatile type it's slow to access...and then,
|
|
// with the SysTick interval that Arduino sets up (1 ms), this would
|
|
// require a subtract and MOD operation for gauging elapsed time, and
|
|
// all taken in combination that lacks adequate temporal resolution
|
|
// for NeoPixel timing. So a kind of horrible thing is done here...
|
|
// since interrupts are turned off anyway and it's generally accepted
|
|
// by now that we're gonna lose track of time in the NeoPixel lib,
|
|
// the SysTick timer is reconfigured for a period matching the NeoPixel
|
|
// bit timing (either 800 or 400 KHz) and we watch SysTick->VAL very
|
|
// closely (just a threshold, no subtract or MOD or anything) and that
|
|
// seems to work just well enough. When finished, the SysTick
|
|
// peripheral is set back to its original state.
|
|
|
|
uint32_t t0, t1, top, ticks, saveLoad = SysTick->LOAD, saveVal = SysTick->VAL;
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
top = (uint32_t)(F_CPU * 0.00000125); // Bit hi + lo = 1.25 uS
|
|
t0 = top - (uint32_t)(F_CPU * 0.00000040); // 0 = 0.4 uS hi
|
|
t1 = top - (uint32_t)(F_CPU * 0.00000080); // 1 = 0.8 uS hi
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 KHz bitstream
|
|
top = (uint32_t)(F_CPU * 0.00000250); // Bit hi + lo = 2.5 uS
|
|
t0 = top - (uint32_t)(F_CPU * 0.00000050); // 0 = 0.5 uS hi
|
|
t1 = top - (uint32_t)(F_CPU * 0.00000120); // 1 = 1.2 uS hi
|
|
}
|
|
#endif
|
|
|
|
SysTick->LOAD = top; // Config SysTick for NeoPixel bit freq
|
|
SysTick->VAL = top; // Set to start value (counts down)
|
|
(void)SysTick->VAL; // Dummy read helps sync up 1st bit
|
|
|
|
for (;;) {
|
|
*set = pinMask; // Set output high
|
|
ticks = (p & bitMask) ? t1 : t0; // SysTick threshold,
|
|
while (SysTick->VAL > ticks)
|
|
; // wait for it
|
|
*clr = pinMask; // Set output low
|
|
if (!(bitMask >>= 1)) { // Next bit for this byte...done?
|
|
if (ptr >= end)
|
|
break; // If last byte sent, exit loop
|
|
p = *ptr++; // Fetch next byte
|
|
bitMask = 0x80; // Reset bitmask
|
|
}
|
|
while (SysTick->VAL <= ticks)
|
|
; // Wait for rollover to 'top'
|
|
}
|
|
|
|
SysTick->LOAD = saveLoad; // Restore SysTick rollover to 1 ms
|
|
SysTick->VAL = saveVal; // Restore SysTick value
|
|
|
|
#elif defined(ARDUINO_STM32_FEATHER) // FEATHER WICED (120MHz)
|
|
|
|
// Tried this with a timer/counter, couldn't quite get adequate
|
|
// resolution. So yay, you get a load of goofball NOPs...
|
|
|
|
uint8_t *ptr, *end, p, bitMask;
|
|
uint32_t pinMask;
|
|
|
|
pinMask = BIT(PIN_MAP[pin].gpio_bit);
|
|
ptr = pixels;
|
|
end = ptr + numBytes;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
|
|
volatile uint16_t *set = &(PIN_MAP[pin].gpio_device->regs->BSRRL);
|
|
volatile uint16_t *clr = &(PIN_MAP[pin].gpio_device->regs->BSRRH);
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
for (;;) {
|
|
if (p & bitMask) { // ONE
|
|
// High 800ns
|
|
*set = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop;");
|
|
// Low 450ns
|
|
*clr = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop;");
|
|
} else { // ZERO
|
|
// High 400ns
|
|
*set = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop;");
|
|
// Low 850ns
|
|
*clr = pinMask;
|
|
asm("nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop; nop; nop; nop; nop;"
|
|
"nop; nop; nop; nop;");
|
|
}
|
|
if (bitMask >>= 1) {
|
|
// Move on to the next pixel
|
|
asm("nop;");
|
|
} else {
|
|
if (ptr >= end)
|
|
break;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 KHz bitstream
|
|
// ToDo!
|
|
}
|
|
#endif
|
|
|
|
#elif defined(TARGET_LPC1768)
|
|
uint8_t *ptr, *end, p, bitMask;
|
|
ptr = pixels;
|
|
end = ptr + numBytes;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
for (;;) {
|
|
if (p & bitMask) {
|
|
// data ONE high
|
|
// min: 550 typ: 700 max: 5,500
|
|
gpio_set(pin);
|
|
time::delay_ns(550);
|
|
// min: 450 typ: 600 max: 5,000
|
|
gpio_clear(pin);
|
|
time::delay_ns(450);
|
|
} else {
|
|
// data ZERO high
|
|
// min: 200 typ: 350 max: 500
|
|
gpio_set(pin);
|
|
time::delay_ns(200);
|
|
// data low
|
|
// min: 450 typ: 600 max: 5,000
|
|
gpio_clear(pin);
|
|
time::delay_ns(450);
|
|
}
|
|
if (bitMask >>= 1) {
|
|
// Move on to the next pixel
|
|
asm("nop;");
|
|
} else {
|
|
if (ptr >= end)
|
|
break;
|
|
p = *ptr++;
|
|
bitMask = 0x80;
|
|
}
|
|
}
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 KHz bitstream
|
|
// ToDo!
|
|
}
|
|
#endif
|
|
#elif defined(ARDUINO_ARCH_STM32) || defined(ARDUINO_ARCH_ARDUINO_CORE_STM32)
|
|
uint8_t *p = pixels, *end = p + numBytes, pix = *p++, mask = 0x80;
|
|
uint32_t cyc;
|
|
uint32_t saveLoad = SysTick->LOAD, saveVal = SysTick->VAL;
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
uint32_t top = (F_CPU / 800000); // 1.25µs
|
|
uint32_t t0 = top - (F_CPU / 2500000); // 0.4µs
|
|
uint32_t t1 = top - (F_CPU / 1250000); // 0.8µs
|
|
SysTick->LOAD = top - 1; // Config SysTick for NeoPixel bit freq
|
|
SysTick->VAL = 0; // Set to start value
|
|
for (;;) {
|
|
LL_GPIO_SetOutputPin(gpioPort, gpioPin);
|
|
cyc = (pix & mask) ? t1 : t0;
|
|
while (SysTick->VAL > cyc)
|
|
;
|
|
LL_GPIO_ResetOutputPin(gpioPort, gpioPin);
|
|
if (!(mask >>= 1)) {
|
|
if (p >= end)
|
|
break;
|
|
pix = *p++;
|
|
mask = 0x80;
|
|
}
|
|
while (SysTick->VAL <= cyc)
|
|
;
|
|
}
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 kHz bitstream
|
|
uint32_t top = (F_CPU / 400000); // 2.5µs
|
|
uint32_t t0 = top - (F_CPU / 2000000); // 0.5µs
|
|
uint32_t t1 = top - (F_CPU / 833333); // 1.2µs
|
|
SysTick->LOAD = top - 1; // Config SysTick for NeoPixel bit freq
|
|
SysTick->VAL = 0; // Set to start value
|
|
for (;;) {
|
|
LL_GPIO_SetOutputPin(gpioPort, gpioPin);
|
|
cyc = (pix & mask) ? t1 : t0;
|
|
while (SysTick->VAL > cyc)
|
|
;
|
|
LL_GPIO_ResetOutputPin(gpioPort, gpioPin);
|
|
if (!(mask >>= 1)) {
|
|
if (p >= end)
|
|
break;
|
|
pix = *p++;
|
|
mask = 0x80;
|
|
}
|
|
while (SysTick->VAL <= cyc)
|
|
;
|
|
}
|
|
}
|
|
#endif // NEO_KHZ400
|
|
SysTick->LOAD = saveLoad; // Restore SysTick rollover to 1 ms
|
|
SysTick->VAL = saveVal; // Restore SysTick value
|
|
#elif defined(NRF51)
|
|
uint8_t *p = pixels, pix, count, mask;
|
|
int32_t num = numBytes;
|
|
unsigned int bitmask = (1 << g_ADigitalPinMap[pin]);
|
|
// https://github.com/sandeepmistry/arduino-nRF5/blob/dc53980c8bac27898fca90d8ecb268e11111edc1/variants/BBCmicrobit/variant.cpp
|
|
|
|
volatile unsigned int *reg = (unsigned int *)(0x50000000UL + 0x508);
|
|
|
|
// https://github.com/sandeepmistry/arduino-nRF5/blob/dc53980c8bac27898fca90d8ecb268e11111edc1/cores/nRF5/SDK/components/device/nrf51.h
|
|
// http://www.iot-programmer.com/index.php/books/27-micro-bit-iot-in-c/chapters-micro-bit-iot-in-c/47-micro-bit-iot-in-c-fast-memory-mapped-gpio?showall=1
|
|
// https://github.com/Microsoft/pxt-neopixel/blob/master/sendbuffer.asm
|
|
|
|
asm volatile(
|
|
// "cpsid i" ; disable irq
|
|
|
|
// b .start
|
|
"b L%=_start"
|
|
"\n\t"
|
|
// .nextbit: ; C0
|
|
"L%=_nextbit:"
|
|
"\n\t" //; C0
|
|
// str r1, [r3, #0] ; pin := hi C2
|
|
"strb %[bitmask], [%[reg], #0]"
|
|
"\n\t" //; pin := hi C2
|
|
// tst r6, r0 ; C3
|
|
"tst %[mask], %[pix]"
|
|
"\n\t" // ; C3
|
|
// bne .islate ; C4
|
|
"bne L%=_islate"
|
|
"\n\t" //; C4
|
|
// str r1, [r2, #0] ; pin := lo C6
|
|
"strb %[bitmask], [%[reg], #4]"
|
|
"\n\t" //; pin := lo C6
|
|
// .islate:
|
|
"L%=_islate:"
|
|
"\n\t"
|
|
// lsrs r6, r6, #1 ; r6 >>= 1 C7
|
|
"lsr %[mask], %[mask], #1"
|
|
"\n\t" //; r6 >>= 1 C7
|
|
// bne .justbit ; C8
|
|
"bne L%=_justbit"
|
|
"\n\t" //; C8
|
|
|
|
// ; not just a bit - need new byte
|
|
// adds r4, #1 ; r4++ C9
|
|
"add %[p], #1"
|
|
"\n\t" //; r4++ C9
|
|
// subs r5, #1 ; r5-- C10
|
|
"sub %[num], #1"
|
|
"\n\t" //; r5-- C10
|
|
// bcc .stop ; if (r5<0) goto .stop C11
|
|
"bcc L%=_stop"
|
|
"\n\t" //; if (r5<0) goto .stop C11
|
|
// .start:
|
|
"L%=_start:"
|
|
// movs r6, #0x80 ; reset mask C12
|
|
"movs %[mask], #0x80"
|
|
"\n\t" //; reset mask C12
|
|
// nop ; C13
|
|
"nop"
|
|
"\n\t" //; C13
|
|
|
|
// .common: ; C13
|
|
"L%=_common:"
|
|
"\n\t" //; C13
|
|
// str r1, [r2, #0] ; pin := lo C15
|
|
"strb %[bitmask], [%[reg], #4]"
|
|
"\n\t" //; pin := lo C15
|
|
// ; always re-load byte - it just fits with the cycles better this way
|
|
// ldrb r0, [r4, #0] ; r0 := *r4 C17
|
|
"ldrb %[pix], [%[p], #0]"
|
|
"\n\t" //; r0 := *r4 C17
|
|
// b .nextbit ; C20
|
|
"b L%=_nextbit"
|
|
"\n\t" //; C20
|
|
|
|
// .justbit: ; C10
|
|
"L%=_justbit:"
|
|
"\n\t" //; C10
|
|
// ; no nops, branch taken is already 3 cycles
|
|
// b .common ; C13
|
|
"b L%=_common"
|
|
"\n\t" //; C13
|
|
|
|
// .stop:
|
|
"L%=_stop:"
|
|
"\n\t"
|
|
// str r1, [r2, #0] ; pin := lo
|
|
"strb %[bitmask], [%[reg], #4]"
|
|
"\n\t" //; pin := lo
|
|
// cpsie i ; enable irq
|
|
|
|
: [p] "+r"(p), [pix] "=&r"(pix), [count] "=&r"(count), [mask] "=&r"(mask),
|
|
[num] "+r"(num)
|
|
: [bitmask] "r"(bitmask), [reg] "r"(reg));
|
|
|
|
#elif defined(__SAM3X8E__) // Arduino Due
|
|
|
|
#define SCALE VARIANT_MCK / 2UL / 1000000UL
|
|
#define INST (2UL * F_CPU / VARIANT_MCK)
|
|
#define TIME_800_0 ((int)(0.40 * SCALE + 0.5) - (5 * INST))
|
|
#define TIME_800_1 ((int)(0.80 * SCALE + 0.5) - (5 * INST))
|
|
#define PERIOD_800 ((int)(1.25 * SCALE + 0.5) - (5 * INST))
|
|
#define TIME_400_0 ((int)(0.50 * SCALE + 0.5) - (5 * INST))
|
|
#define TIME_400_1 ((int)(1.20 * SCALE + 0.5) - (5 * INST))
|
|
#define PERIOD_400 ((int)(2.50 * SCALE + 0.5) - (5 * INST))
|
|
|
|
int pinMask, time0, time1, period, t;
|
|
Pio *port;
|
|
volatile WoReg *portSet, *portClear, *timeValue, *timeReset;
|
|
uint8_t *p, *end, pix, mask;
|
|
|
|
pmc_set_writeprotect(false);
|
|
pmc_enable_periph_clk((uint32_t)TC3_IRQn);
|
|
TC_Configure(TC1, 0,
|
|
TC_CMR_WAVE | TC_CMR_WAVSEL_UP | TC_CMR_TCCLKS_TIMER_CLOCK1);
|
|
TC_Start(TC1, 0);
|
|
|
|
pinMask = g_APinDescription[pin].ulPin; // Don't 'optimize' these into
|
|
port = g_APinDescription[pin].pPort; // declarations above. Want to
|
|
portSet = &(port->PIO_SODR); // burn a few cycles after
|
|
portClear = &(port->PIO_CODR); // starting timer to minimize
|
|
timeValue = &(TC1->TC_CHANNEL[0].TC_CV); // the initial 'while'.
|
|
timeReset = &(TC1->TC_CHANNEL[0].TC_CCR);
|
|
p = pixels;
|
|
end = p + numBytes;
|
|
pix = *p++;
|
|
mask = 0x80;
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
time0 = TIME_800_0;
|
|
time1 = TIME_800_1;
|
|
period = PERIOD_800;
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 KHz bitstream
|
|
time0 = TIME_400_0;
|
|
time1 = TIME_400_1;
|
|
period = PERIOD_400;
|
|
}
|
|
#endif
|
|
|
|
for (t = time0;; t = time0) {
|
|
if (pix & mask)
|
|
t = time1;
|
|
while (*timeValue < (unsigned)period)
|
|
;
|
|
*portSet = pinMask;
|
|
*timeReset = TC_CCR_CLKEN | TC_CCR_SWTRG;
|
|
while (*timeValue < (unsigned)t)
|
|
;
|
|
*portClear = pinMask;
|
|
if (!(mask >>= 1)) { // This 'inside-out' loop logic utilizes
|
|
if (p >= end)
|
|
break; // idle time to minimize inter-byte delays.
|
|
pix = *p++;
|
|
mask = 0x80;
|
|
}
|
|
}
|
|
while (*timeValue < (unsigned)period)
|
|
; // Wait for last bit
|
|
TC_Stop(TC1, 0);
|
|
|
|
|
|
// RENESAS including UNO R4
|
|
#elif defined(ARDUINO_ARCH_RENESAS) || defined(ARDUINO_ARCH_RENESAS_UNO) || defined(ARDUINO_ARCH_RENESAS_PORTENTA)
|
|
|
|
// Definition for a single channel clockless controller for RA4M1 (Cortex M4)
|
|
// See clockless.h for detailed info on how the template parameters are used.
|
|
#define ARM_DEMCR (*(volatile uint32_t *)0xE000EDFC) // Debug Exception and Monitor Control
|
|
#define ARM_DEMCR_TRCENA (1 << 24) // Enable debugging & monitoring blocks
|
|
#define ARM_DWT_CTRL (*(volatile uint32_t *)0xE0001000) // DWT control register
|
|
#define ARM_DWT_CTRL_CYCCNTENA (1 << 0) // Enable cycle count
|
|
#define ARM_DWT_CYCCNT (*(volatile uint32_t *)0xE0001004) // Cycle count register
|
|
|
|
#define F_CPU 48000000
|
|
#define CYCLES_800_T0H (F_CPU / 4000000)
|
|
#define CYCLES_800_T1H (F_CPU / 1250000)
|
|
#define CYCLES_800 (F_CPU / 800000)
|
|
#define CYCLES_400_T0H (F_CPU / 2000000)
|
|
#define CYCLES_400_T1H (F_CPU / 833333)
|
|
#define CYCLES_400 (F_CPU / 400000)
|
|
|
|
uint8_t *p = pixels, *end = p + numBytes, pix, mask;
|
|
|
|
bsp_io_port_pin_t io_pin = g_pin_cfg[pin].pin;
|
|
#define PIN_IO_PORT_ADDR(pn) (R_PORT0 + ((uint32_t) (R_PORT1 - R_PORT0) * ((pn) >> 8u)))
|
|
|
|
volatile uint16_t *set = &(PIN_IO_PORT_ADDR(io_pin)->POSR);
|
|
volatile uint16_t *clr = &(PIN_IO_PORT_ADDR(io_pin)->PORR);
|
|
uint16_t msk = (1U << (io_pin & 0xFF));
|
|
|
|
uint32_t cyc;
|
|
|
|
ARM_DEMCR |= ARM_DEMCR_TRCENA;
|
|
ARM_DWT_CTRL |= ARM_DWT_CTRL_CYCCNTENA;
|
|
|
|
#if defined(NEO_KHZ400) // 800 KHz check needed only if 400 KHz support enabled
|
|
if (is800KHz) {
|
|
#endif
|
|
cyc = ARM_DWT_CYCCNT + CYCLES_800;
|
|
while (p < end) {
|
|
pix = *p++;
|
|
for (mask = 0x80; mask; mask >>= 1) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800)
|
|
;
|
|
cyc = ARM_DWT_CYCCNT;
|
|
*set = msk;
|
|
if (pix & mask) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800_T1H)
|
|
;
|
|
} else {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800_T0H)
|
|
;
|
|
}
|
|
*clr = msk;
|
|
}
|
|
}
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_800)
|
|
;
|
|
#if defined(NEO_KHZ400)
|
|
} else { // 400 kHz bitstream
|
|
cyc = ARM_DWT_CYCCNT + CYCLES_400;
|
|
while (p < end) {
|
|
pix = *p++;
|
|
for (mask = 0x80; mask; mask >>= 1) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400)
|
|
;
|
|
cyc = ARM_DWT_CYCCNT;
|
|
*set = msk;
|
|
if (pix & mask) {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400_T1H)
|
|
;
|
|
} else {
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400_T0H)
|
|
;
|
|
}
|
|
*clr = msk;
|
|
}
|
|
}
|
|
while (ARM_DWT_CYCCNT - cyc < CYCLES_400)
|
|
;
|
|
}
|
|
#endif // NEO_KHZ400
|
|
|
|
#endif // ARM
|
|
|
|
// END ARM ----------------------------------------------------------------
|
|
|
|
#elif defined(ESP8266) || defined(ESP32)
|
|
|
|
// ESP8266 ----------------------------------------------------------------
|
|
|
|
// ESP8266 show() is external to enforce ICACHE_RAM_ATTR execution
|
|
espShow(pin, pixels, numBytes, is800KHz);
|
|
|
|
#elif defined(KENDRYTE_K210)
|
|
|
|
k210Show(pin, pixels, numBytes, is800KHz);
|
|
|
|
#elif defined(__ARDUINO_ARC__)
|
|
|
|
// Arduino 101 -----------------------------------------------------------
|
|
|
|
#define NOPx7 \
|
|
{ \
|
|
__builtin_arc_nop(); \
|
|
__builtin_arc_nop(); \
|
|
__builtin_arc_nop(); \
|
|
__builtin_arc_nop(); \
|
|
__builtin_arc_nop(); \
|
|
__builtin_arc_nop(); \
|
|
__builtin_arc_nop(); \
|
|
}
|
|
|
|
PinDescription *pindesc = &g_APinDescription[pin];
|
|
register uint32_t loop =
|
|
8 * numBytes; // one loop to handle all bytes and all bits
|
|
register uint8_t *p = pixels;
|
|
register uint32_t currByte = (uint32_t)(*p);
|
|
register uint32_t currBit = 0x80 & currByte;
|
|
register uint32_t bitCounter = 0;
|
|
register uint32_t first = 1;
|
|
|
|
// The loop is unusual. Very first iteration puts all the way LOW to the wire
|
|
// - constant LOW does not affect NEOPIXEL, so there is no visible effect
|
|
// displayed. During that very first iteration CPU caches instructions in the
|
|
// loop. Because of the caching process, "CPU slows down". NEOPIXEL pulse is
|
|
// very time sensitive that's why we let the CPU cache first and we start
|
|
// regular pulse from 2nd iteration
|
|
if (pindesc->ulGPIOType == SS_GPIO) {
|
|
register uint32_t reg = pindesc->ulGPIOBase + SS_GPIO_SWPORTA_DR;
|
|
uint32_t reg_val = __builtin_arc_lr((volatile uint32_t)reg);
|
|
register uint32_t reg_bit_high = reg_val | (1 << pindesc->ulGPIOId);
|
|
register uint32_t reg_bit_low = reg_val & ~(1 << pindesc->ulGPIOId);
|
|
|
|
loop += 1; // include first, special iteration
|
|
while (loop--) {
|
|
if (!first) {
|
|
currByte <<= 1;
|
|
bitCounter++;
|
|
}
|
|
|
|
// 1 is >550ns high and >450ns low; 0 is 200..500ns high and >450ns low
|
|
__builtin_arc_sr(first ? reg_bit_low : reg_bit_high,
|
|
(volatile uint32_t)reg);
|
|
if (currBit) { // ~400ns HIGH (740ns overall)
|
|
NOPx7 NOPx7
|
|
}
|
|
// ~340ns HIGH
|
|
NOPx7 __builtin_arc_nop();
|
|
|
|
// 820ns LOW; per spec, max allowed low here is 5000ns */
|
|
__builtin_arc_sr(reg_bit_low, (volatile uint32_t)reg);
|
|
NOPx7 NOPx7
|
|
|
|
if (bitCounter >= 8) {
|
|
bitCounter = 0;
|
|
currByte = (uint32_t)(*++p);
|
|
}
|
|
|
|
currBit = 0x80 & currByte;
|
|
first = 0;
|
|
}
|
|
} else if (pindesc->ulGPIOType == SOC_GPIO) {
|
|
register uint32_t reg = pindesc->ulGPIOBase + SOC_GPIO_SWPORTA_DR;
|
|
uint32_t reg_val = MMIO_REG_VAL(reg);
|
|
register uint32_t reg_bit_high = reg_val | (1 << pindesc->ulGPIOId);
|
|
register uint32_t reg_bit_low = reg_val & ~(1 << pindesc->ulGPIOId);
|
|
|
|
loop += 1; // include first, special iteration
|
|
while (loop--) {
|
|
if (!first) {
|
|
currByte <<= 1;
|
|
bitCounter++;
|
|
}
|
|
MMIO_REG_VAL(reg) = first ? reg_bit_low : reg_bit_high;
|
|
if (currBit) { // ~430ns HIGH (740ns overall)
|
|
NOPx7 NOPx7 __builtin_arc_nop();
|
|
}
|
|
// ~310ns HIGH
|
|
NOPx7
|
|
|
|
// 850ns LOW; per spec, max allowed low here is 5000ns */
|
|
MMIO_REG_VAL(reg) = reg_bit_low;
|
|
NOPx7 NOPx7
|
|
|
|
if (bitCounter >= 8) {
|
|
bitCounter = 0;
|
|
currByte = (uint32_t)(*++p);
|
|
}
|
|
|
|
currBit = 0x80 & currByte;
|
|
first = 0;
|
|
}
|
|
}
|
|
|
|
#elif defined(ARDUINO_ARCH_CH32)
|
|
ch32Show(gpioPort, gpioPin, pixels, numBytes, is800KHz);
|
|
#else
|
|
#error Architecture not supported
|
|
#endif
|
|
|
|
// END ARCHITECTURE SELECT ------------------------------------------------
|
|
|
|
#if !(defined(NRF52) || defined(NRF52_SERIES) || defined(ESP32))
|
|
interrupts();
|
|
#endif
|
|
|
|
endTime = micros(); // Save EOD time for latch on next call
|
|
}
|
|
|
|
/*!
|
|
@brief Set/change the NeoPixel output pin number. Previous pin,
|
|
if any, is set to INPUT and the new pin is set to OUTPUT.
|
|
@param p Arduino pin number (-1 = no pin).
|
|
*/
|
|
void Adafruit_NeoPixel::setPin(int16_t p) {
|
|
if (begun && (pin >= 0))
|
|
pinMode(pin, INPUT); // Disable existing out pin
|
|
pin = p;
|
|
if (begun) {
|
|
pinMode(p, OUTPUT);
|
|
digitalWrite(p, LOW);
|
|
}
|
|
#if defined(__AVR__)
|
|
port = portOutputRegister(digitalPinToPort(p));
|
|
pinMask = digitalPinToBitMask(p);
|
|
#endif
|
|
#if defined(ARDUINO_ARCH_STM32) || defined(ARDUINO_ARCH_ARDUINO_CORE_STM32)
|
|
gpioPort = digitalPinToPort(p);
|
|
gpioPin = STM_LL_GPIO_PIN(digitalPinToPinName(p));
|
|
#elif defined(ARDUINO_ARCH_CH32)
|
|
PinName const pin_name = digitalPinToPinName(pin);
|
|
gpioPort = get_GPIO_Port(CH_PORT(pin_name));
|
|
gpioPin = CH_GPIO_PIN(pin_name);
|
|
#if defined (CH32V20x_D6)
|
|
if (gpioPort == GPIOC && ((*(volatile uint32_t*)0x40022030) & 0x0F000000) == 0) {
|
|
gpioPin = gpioPin >> 13;
|
|
}
|
|
#endif
|
|
#endif
|
|
}
|
|
|
|
/*!
|
|
@brief Set a pixel's color using separate red, green and blue
|
|
components. If using RGBW pixels, white will be set to 0.
|
|
@param n Pixel index, starting from 0.
|
|
@param r Red brightness, 0 = minimum (off), 255 = maximum.
|
|
@param g Green brightness, 0 = minimum (off), 255 = maximum.
|
|
@param b Blue brightness, 0 = minimum (off), 255 = maximum.
|
|
*/
|
|
void Adafruit_NeoPixel::setPixelColor(uint16_t n, uint8_t r, uint8_t g,
|
|
uint8_t b) {
|
|
|
|
if (n < numLEDs) {
|
|
if (brightness) { // See notes in setBrightness()
|
|
r = (r * brightness) >> 8;
|
|
g = (g * brightness) >> 8;
|
|
b = (b * brightness) >> 8;
|
|
}
|
|
uint8_t *p;
|
|
if (wOffset == rOffset) { // Is an RGB-type strip
|
|
p = &pixels[n * 3]; // 3 bytes per pixel
|
|
} else { // Is a WRGB-type strip
|
|
p = &pixels[n * 4]; // 4 bytes per pixel
|
|
p[wOffset] = 0; // But only R,G,B passed -- set W to 0
|
|
}
|
|
p[rOffset] = r; // R,G,B always stored
|
|
p[gOffset] = g;
|
|
p[bOffset] = b;
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Set a pixel's color using separate red, green, blue and white
|
|
components (for RGBW NeoPixels only).
|
|
@param n Pixel index, starting from 0.
|
|
@param r Red brightness, 0 = minimum (off), 255 = maximum.
|
|
@param g Green brightness, 0 = minimum (off), 255 = maximum.
|
|
@param b Blue brightness, 0 = minimum (off), 255 = maximum.
|
|
@param w White brightness, 0 = minimum (off), 255 = maximum, ignored
|
|
if using RGB pixels.
|
|
*/
|
|
void Adafruit_NeoPixel::setPixelColor(uint16_t n, uint8_t r, uint8_t g,
|
|
uint8_t b, uint8_t w) {
|
|
|
|
if (n < numLEDs) {
|
|
if (brightness) { // See notes in setBrightness()
|
|
r = (r * brightness) >> 8;
|
|
g = (g * brightness) >> 8;
|
|
b = (b * brightness) >> 8;
|
|
w = (w * brightness) >> 8;
|
|
}
|
|
uint8_t *p;
|
|
if (wOffset == rOffset) { // Is an RGB-type strip
|
|
p = &pixels[n * 3]; // 3 bytes per pixel (ignore W)
|
|
} else { // Is a WRGB-type strip
|
|
p = &pixels[n * 4]; // 4 bytes per pixel
|
|
p[wOffset] = w; // Store W
|
|
}
|
|
p[rOffset] = r; // Store R,G,B
|
|
p[gOffset] = g;
|
|
p[bOffset] = b;
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Set a pixel's color using a 32-bit 'packed' RGB or RGBW value.
|
|
@param n Pixel index, starting from 0.
|
|
@param c 32-bit color value. Most significant byte is white (for RGBW
|
|
pixels) or ignored (for RGB pixels), next is red, then green,
|
|
and least significant byte is blue.
|
|
*/
|
|
void Adafruit_NeoPixel::setPixelColor(uint16_t n, uint32_t c) {
|
|
if (n < numLEDs) {
|
|
uint8_t *p, r = (uint8_t)(c >> 16), g = (uint8_t)(c >> 8), b = (uint8_t)c;
|
|
if (brightness) { // See notes in setBrightness()
|
|
r = (r * brightness) >> 8;
|
|
g = (g * brightness) >> 8;
|
|
b = (b * brightness) >> 8;
|
|
}
|
|
if (wOffset == rOffset) {
|
|
p = &pixels[n * 3];
|
|
} else {
|
|
p = &pixels[n * 4];
|
|
uint8_t w = (uint8_t)(c >> 24);
|
|
p[wOffset] = brightness ? ((w * brightness) >> 8) : w;
|
|
}
|
|
p[rOffset] = r;
|
|
p[gOffset] = g;
|
|
p[bOffset] = b;
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Fill all or part of the NeoPixel strip with a color.
|
|
@param c 32-bit color value. Most significant byte is white (for
|
|
RGBW pixels) or ignored (for RGB pixels), next is red,
|
|
then green, and least significant byte is blue. If all
|
|
arguments are unspecified, this will be 0 (off).
|
|
@param first Index of first pixel to fill, starting from 0. Must be
|
|
in-bounds, no clipping is performed. 0 if unspecified.
|
|
@param count Number of pixels to fill, as a positive value. Passing
|
|
0 or leaving unspecified will fill to end of strip.
|
|
*/
|
|
void Adafruit_NeoPixel::fill(uint32_t c, uint16_t first, uint16_t count) {
|
|
uint16_t i, end;
|
|
|
|
if (first >= numLEDs) {
|
|
return; // If first LED is past end of strip, nothing to do
|
|
}
|
|
|
|
// Calculate the index ONE AFTER the last pixel to fill
|
|
if (count == 0) {
|
|
// Fill to end of strip
|
|
end = numLEDs;
|
|
} else {
|
|
// Ensure that the loop won't go past the last pixel
|
|
end = first + count;
|
|
if (end > numLEDs)
|
|
end = numLEDs;
|
|
}
|
|
|
|
for (i = first; i < end; i++) {
|
|
this->setPixelColor(i, c);
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Convert hue, saturation and value into a packed 32-bit RGB color
|
|
that can be passed to setPixelColor() or other RGB-compatible
|
|
functions.
|
|
@param hue An unsigned 16-bit value, 0 to 65535, representing one full
|
|
loop of the color wheel, which allows 16-bit hues to "roll
|
|
over" while still doing the expected thing (and allowing
|
|
more precision than the wheel() function that was common to
|
|
prior NeoPixel examples).
|
|
@param sat Saturation, 8-bit value, 0 (min or pure grayscale) to 255
|
|
(max or pure hue). Default of 255 if unspecified.
|
|
@param val Value (brightness), 8-bit value, 0 (min / black / off) to
|
|
255 (max or full brightness). Default of 255 if unspecified.
|
|
@return Packed 32-bit RGB with the most significant byte set to 0 -- the
|
|
white element of WRGB pixels is NOT utilized. Result is linearly
|
|
but not perceptually correct, so you may want to pass the result
|
|
through the gamma32() function (or your own gamma-correction
|
|
operation) else colors may appear washed out. This is not done
|
|
automatically by this function because coders may desire a more
|
|
refined gamma-correction function than the simplified
|
|
one-size-fits-all operation of gamma32(). Diffusing the LEDs also
|
|
really seems to help when using low-saturation colors.
|
|
*/
|
|
uint32_t Adafruit_NeoPixel::ColorHSV(uint16_t hue, uint8_t sat, uint8_t val) {
|
|
|
|
uint8_t r, g, b;
|
|
|
|
// Remap 0-65535 to 0-1529. Pure red is CENTERED on the 64K rollover;
|
|
// 0 is not the start of pure red, but the midpoint...a few values above
|
|
// zero and a few below 65536 all yield pure red (similarly, 32768 is the
|
|
// midpoint, not start, of pure cyan). The 8-bit RGB hexcone (256 values
|
|
// each for red, green, blue) really only allows for 1530 distinct hues
|
|
// (not 1536, more on that below), but the full unsigned 16-bit type was
|
|
// chosen for hue so that one's code can easily handle a contiguous color
|
|
// wheel by allowing hue to roll over in either direction.
|
|
hue = (hue * 1530L + 32768) / 65536;
|
|
// Because red is centered on the rollover point (the +32768 above,
|
|
// essentially a fixed-point +0.5), the above actually yields 0 to 1530,
|
|
// where 0 and 1530 would yield the same thing. Rather than apply a
|
|
// costly modulo operator, 1530 is handled as a special case below.
|
|
|
|
// So you'd think that the color "hexcone" (the thing that ramps from
|
|
// pure red, to pure yellow, to pure green and so forth back to red,
|
|
// yielding six slices), and with each color component having 256
|
|
// possible values (0-255), might have 1536 possible items (6*256),
|
|
// but in reality there's 1530. This is because the last element in
|
|
// each 256-element slice is equal to the first element of the next
|
|
// slice, and keeping those in there this would create small
|
|
// discontinuities in the color wheel. So the last element of each
|
|
// slice is dropped...we regard only elements 0-254, with item 255
|
|
// being picked up as element 0 of the next slice. Like this:
|
|
// Red to not-quite-pure-yellow is: 255, 0, 0 to 255, 254, 0
|
|
// Pure yellow to not-quite-pure-green is: 255, 255, 0 to 1, 255, 0
|
|
// Pure green to not-quite-pure-cyan is: 0, 255, 0 to 0, 255, 254
|
|
// and so forth. Hence, 1530 distinct hues (0 to 1529), and hence why
|
|
// the constants below are not the multiples of 256 you might expect.
|
|
|
|
// Convert hue to R,G,B (nested ifs faster than divide+mod+switch):
|
|
if (hue < 510) { // Red to Green-1
|
|
b = 0;
|
|
if (hue < 255) { // Red to Yellow-1
|
|
r = 255;
|
|
g = hue; // g = 0 to 254
|
|
} else { // Yellow to Green-1
|
|
r = 510 - hue; // r = 255 to 1
|
|
g = 255;
|
|
}
|
|
} else if (hue < 1020) { // Green to Blue-1
|
|
r = 0;
|
|
if (hue < 765) { // Green to Cyan-1
|
|
g = 255;
|
|
b = hue - 510; // b = 0 to 254
|
|
} else { // Cyan to Blue-1
|
|
g = 1020 - hue; // g = 255 to 1
|
|
b = 255;
|
|
}
|
|
} else if (hue < 1530) { // Blue to Red-1
|
|
g = 0;
|
|
if (hue < 1275) { // Blue to Magenta-1
|
|
r = hue - 1020; // r = 0 to 254
|
|
b = 255;
|
|
} else { // Magenta to Red-1
|
|
r = 255;
|
|
b = 1530 - hue; // b = 255 to 1
|
|
}
|
|
} else { // Last 0.5 Red (quicker than % operator)
|
|
r = 255;
|
|
g = b = 0;
|
|
}
|
|
|
|
// Apply saturation and value to R,G,B, pack into 32-bit result:
|
|
uint32_t v1 = 1 + val; // 1 to 256; allows >>8 instead of /255
|
|
uint16_t s1 = 1 + sat; // 1 to 256; same reason
|
|
uint8_t s2 = 255 - sat; // 255 to 0
|
|
return ((((((r * s1) >> 8) + s2) * v1) & 0xff00) << 8) |
|
|
(((((g * s1) >> 8) + s2) * v1) & 0xff00) |
|
|
(((((b * s1) >> 8) + s2) * v1) >> 8);
|
|
}
|
|
|
|
/*!
|
|
@brief Query the color of a previously-set pixel.
|
|
@param n Index of pixel to read (0 = first).
|
|
@return 'Packed' 32-bit RGB or WRGB value. Most significant byte is white
|
|
(for RGBW pixels) or 0 (for RGB pixels), next is red, then green,
|
|
and least significant byte is blue.
|
|
@note If the strip brightness has been changed from the default value
|
|
of 255, the color read from a pixel may not exactly match what
|
|
was previously written with one of the setPixelColor() functions.
|
|
This gets more pronounced at lower brightness levels.
|
|
*/
|
|
uint32_t Adafruit_NeoPixel::getPixelColor(uint16_t n) const {
|
|
if (n >= numLEDs)
|
|
return 0; // Out of bounds, return no color.
|
|
|
|
uint8_t *p;
|
|
|
|
if (wOffset == rOffset) { // Is RGB-type device
|
|
p = &pixels[n * 3];
|
|
if (brightness) {
|
|
// Stored color was decimated by setBrightness(). Returned value
|
|
// attempts to scale back to an approximation of the original 24-bit
|
|
// value used when setting the pixel color, but there will always be
|
|
// some error -- those bits are simply gone. Issue is most
|
|
// pronounced at low brightness levels.
|
|
return (((uint32_t)(p[rOffset] << 8) / brightness) << 16) |
|
|
(((uint32_t)(p[gOffset] << 8) / brightness) << 8) |
|
|
((uint32_t)(p[bOffset] << 8) / brightness);
|
|
} else {
|
|
// No brightness adjustment has been made -- return 'raw' color
|
|
return ((uint32_t)p[rOffset] << 16) | ((uint32_t)p[gOffset] << 8) |
|
|
(uint32_t)p[bOffset];
|
|
}
|
|
} else { // Is RGBW-type device
|
|
p = &pixels[n * 4];
|
|
if (brightness) { // Return scaled color
|
|
return (((uint32_t)(p[wOffset] << 8) / brightness) << 24) |
|
|
(((uint32_t)(p[rOffset] << 8) / brightness) << 16) |
|
|
(((uint32_t)(p[gOffset] << 8) / brightness) << 8) |
|
|
((uint32_t)(p[bOffset] << 8) / brightness);
|
|
} else { // Return raw color
|
|
return ((uint32_t)p[wOffset] << 24) | ((uint32_t)p[rOffset] << 16) |
|
|
((uint32_t)p[gOffset] << 8) | (uint32_t)p[bOffset];
|
|
}
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Adjust output brightness. Does not immediately affect what's
|
|
currently displayed on the LEDs. The next call to show() will
|
|
refresh the LEDs at this level.
|
|
@param b Brightness setting, 0=minimum (off), 255=brightest.
|
|
@note This was intended for one-time use in one's setup() function,
|
|
not as an animation effect in itself. Because of the way this
|
|
library "pre-multiplies" LED colors in RAM, changing the
|
|
brightness is often a "lossy" operation -- what you write to
|
|
pixels isn't necessary the same as what you'll read back.
|
|
Repeated brightness changes using this function exacerbate the
|
|
problem. Smart programs therefore treat the strip as a
|
|
write-only resource, maintaining their own state to render each
|
|
frame of an animation, not relying on read-modify-write.
|
|
*/
|
|
void Adafruit_NeoPixel::setBrightness(uint8_t b) {
|
|
// Stored brightness value is different than what's passed.
|
|
// This simplifies the actual scaling math later, allowing a fast
|
|
// 8x8-bit multiply and taking the MSB. 'brightness' is a uint8_t,
|
|
// adding 1 here may (intentionally) roll over...so 0 = max brightness
|
|
// (color values are interpreted literally; no scaling), 1 = min
|
|
// brightness (off), 255 = just below max brightness.
|
|
uint8_t newBrightness = b + 1;
|
|
if (newBrightness != brightness) { // Compare against prior value
|
|
// Brightness has changed -- re-scale existing data in RAM,
|
|
// This process is potentially "lossy," especially when increasing
|
|
// brightness. The tight timing in the WS2811/WS2812 code means there
|
|
// aren't enough free cycles to perform this scaling on the fly as data
|
|
// is issued. So we make a pass through the existing color data in RAM
|
|
// and scale it (subsequent graphics commands also work at this
|
|
// brightness level). If there's a significant step up in brightness,
|
|
// the limited number of steps (quantization) in the old data will be
|
|
// quite visible in the re-scaled version. For a non-destructive
|
|
// change, you'll need to re-render the full strip data. C'est la vie.
|
|
uint8_t c, *ptr = pixels,
|
|
oldBrightness = brightness - 1; // De-wrap old brightness value
|
|
uint16_t scale;
|
|
if (oldBrightness == 0)
|
|
scale = 0; // Avoid /0
|
|
else if (b == 255)
|
|
scale = 65535 / oldBrightness;
|
|
else
|
|
scale = (((uint16_t)newBrightness << 8) - 1) / oldBrightness;
|
|
for (uint16_t i = 0; i < numBytes; i++) {
|
|
c = *ptr;
|
|
*ptr++ = (c * scale) >> 8;
|
|
}
|
|
brightness = newBrightness;
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Retrieve the last-set brightness value for the strip.
|
|
@return Brightness value: 0 = minimum (off), 255 = maximum.
|
|
*/
|
|
uint8_t Adafruit_NeoPixel::getBrightness(void) const { return brightness - 1; }
|
|
|
|
/*!
|
|
@brief Fill the whole NeoPixel strip with 0 / black / off.
|
|
*/
|
|
void Adafruit_NeoPixel::clear(void) { memset(pixels, 0, numBytes); }
|
|
|
|
// A 32-bit variant of gamma8() that applies the same function
|
|
// to all components of a packed RGB or WRGB value.
|
|
uint32_t Adafruit_NeoPixel::gamma32(uint32_t x) {
|
|
uint8_t *y = (uint8_t *)&x;
|
|
// All four bytes of a 32-bit value are filtered even if RGB (not WRGB),
|
|
// to avoid a bunch of shifting and masking that would be necessary for
|
|
// properly handling different endianisms (and each byte is a fairly
|
|
// trivial operation, so it might not even be wasting cycles vs a check
|
|
// and branch for the RGB case). In theory this might cause trouble *if*
|
|
// someone's storing information in the unused most significant byte
|
|
// of an RGB value, but this seems exceedingly rare and if it's
|
|
// encountered in reality they can mask values going in or coming out.
|
|
for (uint8_t i = 0; i < 4; i++)
|
|
y[i] = gamma8(y[i]);
|
|
return x; // Packed 32-bit return
|
|
}
|
|
|
|
/*!
|
|
@brief Fill NeoPixel strip with one or more cycles of hues.
|
|
Everyone loves the rainbow swirl so much, now it's canon!
|
|
@param first_hue Hue of first pixel, 0-65535, representing one full
|
|
cycle of the color wheel. Each subsequent pixel will
|
|
be offset to complete one or more cycles over the
|
|
length of the strip.
|
|
@param reps Number of cycles of the color wheel over the length
|
|
of the strip. Default is 1. Negative values can be
|
|
used to reverse the hue order.
|
|
@param saturation Saturation (optional), 0-255 = gray to pure hue,
|
|
default = 255.
|
|
@param brightness Brightness/value (optional), 0-255 = off to max,
|
|
default = 255. This is distinct and in combination
|
|
with any configured global strip brightness.
|
|
@param gammify If true (default), apply gamma correction to colors
|
|
for better appearance.
|
|
*/
|
|
void Adafruit_NeoPixel::rainbow(uint16_t first_hue, int8_t reps,
|
|
uint8_t saturation, uint8_t brightness, bool gammify) {
|
|
for (uint16_t i=0; i<numLEDs; i++) {
|
|
uint16_t hue = first_hue + (i * reps * 65536) / numLEDs;
|
|
uint32_t color = ColorHSV(hue, saturation, brightness);
|
|
if (gammify) color = gamma32(color);
|
|
setPixelColor(i, color);
|
|
}
|
|
}
|
|
|
|
/*!
|
|
@brief Convert pixel color order from string (e.g. "BGR") to NeoPixel
|
|
color order constant (e.g. NEO_BGR). This may be helpful for code
|
|
that initializes from text configuration rather than compile-time
|
|
constants.
|
|
@param v Input string. Should be reasonably sanitized (a 3- or 4-
|
|
character NUL-terminated string) or undefined behavior may
|
|
result (output is still a valid NeoPixel order constant, but
|
|
might not present as expected). Garbage in, garbage out.
|
|
@return One of the NeoPixel color order constants (e.g. NEO_BGR).
|
|
NEO_KHZ400 or NEO_KHZ800 bits are not included, nor needed (all
|
|
NeoPixels actually support 800 KHz it's been found, and this is
|
|
the default state if no KHZ bits set).
|
|
@note This function is declared static in the class so it can be called
|
|
without a NeoPixel object (since it's not likely been declared
|
|
in the code yet). Use Adafruit_NeoPixel::str2order().
|
|
*/
|
|
neoPixelType Adafruit_NeoPixel::str2order(const char *v) {
|
|
int8_t r = 0, g = 0, b = 0, w = -1;
|
|
if (v) {
|
|
char c;
|
|
for (uint8_t i=0; ((c = tolower(v[i]))); i++) {
|
|
if (c == 'r') r = i;
|
|
else if (c == 'g') g = i;
|
|
else if (c == 'b') b = i;
|
|
else if (c == 'w') w = i;
|
|
}
|
|
r &= 3;
|
|
}
|
|
if (w < 0) w = r; // If 'w' not specified, duplicate r bits
|
|
return (w << 6) | (r << 4) | ((g & 3) << 2) | (b & 3);
|
|
}
|