diff options
| author | mrfaptastic <12006953+mrfaptastic@users.noreply.github.com> | 2022-09-30 03:17:19 +0100 |
|---|---|---|
| committer | mrfaptastic <12006953+mrfaptastic@users.noreply.github.com> | 2022-09-30 03:17:19 +0100 |
| commit | ebe75dcaba0239d225243cdedd31aaf860abbd0a (patch) | |
| tree | fda21143906b93de687447af52c40f9329956d21 /src/ESP32-HUB75-MatrixPanel-I2S-DMA.cpp | |
| parent | 86063fe594cda6a572bd335e7e34af7c75226aad (diff) | |
Update to include S3 support.
Refactor tonnes of code. Double buffering not yet fully tested. PSRAM support doesn't work at all - garbled mess.
Enable in platformIO using:
build_flags =
-DSPIRAM_FRAMEBUFFER=1
Diffstat (limited to 'src/ESP32-HUB75-MatrixPanel-I2S-DMA.cpp')
| -rw-r--r-- | src/ESP32-HUB75-MatrixPanel-I2S-DMA.cpp | 886 |
1 files changed, 886 insertions, 0 deletions
diff --git a/src/ESP32-HUB75-MatrixPanel-I2S-DMA.cpp b/src/ESP32-HUB75-MatrixPanel-I2S-DMA.cpp new file mode 100644 index 0000000..6d8e521 --- /dev/null +++ b/src/ESP32-HUB75-MatrixPanel-I2S-DMA.cpp @@ -0,0 +1,886 @@ +#include "ESP32-HUB75-MatrixPanel-I2S-DMA.h" + +static const char* TAG = "MatrixPanel"; + +/* this replicates same function in rowBitStruct, but due to induced inlining it might be MUCH faster when used in tight loops + * while method from struct could be flushed out of instruction cache between loop cycles + * do NOT forget about buff_id param if using this + * + * faptastic note oct22: struct call is not inlined... commenting out this additional compile declaration + */ +//#define getRowDataPtr(row, _dpth, buff_id) &(dma_buff.rowBits[row]->data[_dpth * dma_buff.rowBits[row]->width + buff_id*(dma_buff.rowBits[row]->width * dma_buff.rowBits[row]->color_depth)]) + +bool MatrixPanel_I2S_DMA::allocateDMAmemory() +{ + + // Alright, theoretically we should be OK, so let us do this, so + // lets allocate a chunk of memory for each row (a row could span multiple panels if chaining is in place) + dma_buff.rowBits.reserve(ROWS_PER_FRAME); + + // iterate through number of rows + for (int malloc_num =0; malloc_num < ROWS_PER_FRAME; ++malloc_num) + { + auto ptr = std::make_shared<rowBitStruct>(PIXELS_PER_ROW, PIXEL_COLOR_DEPTH_BITS, m_cfg.double_buff); + + if (ptr->data == nullptr) + { + #if SERIAL_DEBUG + Serial.printf_P(PSTR("ERROR: Couldn't malloc rowBitStruct %d! Critical fail.\r\n"), malloc_num); + #endif + return false; + // TODO: should we release all previous rowBitStructs here??? + } + + dma_buff.rowBits.emplace_back(ptr); // save new rowBitStruct into rows vector + ++dma_buff.rows; + } + + // calculate the lowest LSBMSB_TRANSITION_BIT value that will fit in memory that will meet or exceed the configured refresh rate + while(1) { + int psPerClock = 1000000000000UL/m_cfg.i2sspeed; + int nsPerLatch = ((PIXELS_PER_ROW + CLKS_DURING_LATCH) * psPerClock) / 1000; + + // add time to shift out LSBs + LSB-MSB transition bit - this ignores fractions... + int nsPerRow = PIXEL_COLOR_DEPTH_BITS * nsPerLatch; + + // add time to shift out MSBs + for(int i=lsbMsbTransitionBit + 1; i<PIXEL_COLOR_DEPTH_BITS; i++) + nsPerRow += (1<<(i - lsbMsbTransitionBit - 1)) * (PIXEL_COLOR_DEPTH_BITS - i) * nsPerLatch; + + int nsPerFrame = nsPerRow * ROWS_PER_FRAME; + int actualRefreshRate = 1000000000UL/(nsPerFrame); + calculated_refresh_rate = actualRefreshRate; + + #if SERIAL_DEBUG + Serial.printf_P(PSTR("lsbMsbTransitionBit of %d gives %d Hz refresh: \r\n"), lsbMsbTransitionBit, actualRefreshRate); + #endif + + if (actualRefreshRate > m_cfg.min_refresh_rate) + break; + + if(lsbMsbTransitionBit < PIXEL_COLOR_DEPTH_BITS - 1) + lsbMsbTransitionBit++; + else + break; + } + + + + /*** + * Step 2a: lsbMsbTransition bit is now finalised - recalculate the DMA descriptor count required, which is used for + * memory allocation of the DMA linked list memory structure. + */ + int numDMAdescriptorsPerRow = 1; + for(int i=lsbMsbTransitionBit + 1; i<PIXEL_COLOR_DEPTH_BITS; i++) { + numDMAdescriptorsPerRow += (1<<(i - lsbMsbTransitionBit - 1)); + } + #if SERIAL_DEBUG + Serial.printf_P(PSTR("Recalculated number of DMA descriptors per row: %d\n"), numDMAdescriptorsPerRow); + #endif + + // Refer to 'DMA_LL_PAYLOAD_SPLIT' code in configureDMA() below to understand why this exists. + // numDMAdescriptorsPerRow is also used to calculate descount which is super important in i2s_parallel_config_t SoC DMA setup. + if ( dma_buff.rowBits[0]->size() > DMA_MAX ) { + + #if SERIAL_DEBUG + Serial.printf_P(PSTR("rowColorDepthStruct struct is too large, split DMA payload required. Adding %d DMA descriptors\n"), PIXEL_COLOR_DEPTH_BITS-1); + #endif + + numDMAdescriptorsPerRow += PIXEL_COLOR_DEPTH_BITS-1; + // Note: If numDMAdescriptorsPerRow is even just one descriptor too large, DMA linked list will not correctly loop. + } + + + /*** + * Step 3: Allocate memory for DMA linked list, linking up each framebuffer row in sequence for GPIO output. + */ + + // malloc the DMA linked list descriptors that i2s_parallel will need + desccount = numDMAdescriptorsPerRow * ROWS_PER_FRAME; + + dma_bus.allocate_dma_desc_memory(desccount); + +/* + //lldesc_t * dmadesc_a = (lldesc_t *)heap_caps_malloc(desccount * sizeof(lldesc_t), MALLOC_CAP_DMA); + dmadesc_a = (lldesc_t *)heap_caps_malloc(desccount * sizeof(lldesc_t), MALLOC_CAP_DMA); + assert("Can't allocate descriptor framebuffer a"); + if(!dmadesc_a) { +#if SERIAL_DEBUG + Serial.println(F("ERROR: Could not malloc descriptor framebuffer a.")); +#endif + return false; + } + + if (m_cfg.double_buff) // reserve space for second framebuffer linked list + { + //lldesc_t * dmadesc_b = (lldesc_t *)heap_caps_malloc(desccount * sizeof(lldesc_t), MALLOC_CAP_DMA); + dmadesc_b = (lldesc_t *)heap_caps_malloc(desccount * sizeof(lldesc_t), MALLOC_CAP_DMA); + assert("Could not malloc descriptor framebuffer b."); + if(!dmadesc_b) { +#if SERIAL_DEBUG + Serial.println(F("ERROR: Could not malloc descriptor framebuffer b.")); +#endif + return false; + } + } + */ + + // Just os we know + initialized = true; + + return true; + +} // end allocateDMAmemory() + + + +void MatrixPanel_I2S_DMA::configureDMA(const HUB75_I2S_CFG& _cfg) +{ + + // lldesc_t *previous_dmadesc_a = 0; + // lldesc_t *previous_dmadesc_b = 0; + int current_dmadescriptor_offset = 0; + + // HACK: If we need to split the payload in 1/2 so that it doesn't breach DMA_MAX, lets do it by the color_depth. + int num_dma_payload_color_depths = PIXEL_COLOR_DEPTH_BITS; + if ( dma_buff.rowBits[0]->size() > DMA_MAX ) { + num_dma_payload_color_depths = 1; + } + + // Fill DMA linked lists for both frames (as in, halves of the HUB75 panel) and if double buffering is enabled, link it up for both buffers. + for(int row = 0; row < ROWS_PER_FRAME; row++) { + + // first set of data is LSB through MSB, single pass (IF TOTAL SIZE < DMA_MAX) - all color bits are displayed once, which takes care of everything below and including LSBMSB_TRANSITION_BIT + // NOTE: size must be less than DMA_MAX - worst case for library: 16-bpp with 256 pixels per row would exceed this, need to break into two + //link_dma_desc(&dmadesc_a[current_dmadescriptor_offset], previous_dmadesc_a, dma_buff.rowBits[row]->getDataPtr(), dma_buff.rowBits[row]->size(num_dma_payload_color_depths)); + // previous_dmadesc_a = &dmadesc_a[current_dmadescriptor_offset]; + + dma_bus.create_dma_desc_link(dma_buff.rowBits[row]->getDataPtr(), dma_buff.rowBits[row]->size(num_dma_payload_color_depths)); + + if (m_cfg.double_buff) { + dma_bus.create_dma_desc_link(dma_buff.rowBits[row]->getDataPtr(), dma_buff.rowBits[row]->size(num_dma_payload_color_depths), true); + //link_dma_desc(&dmadesc_b[current_dmadescriptor_offset], previous_dmadesc_b, dma_buff.rowBits[row]->getDataPtr(0, 1), dma_buff.rowBits[row]->size(num_dma_payload_color_depths)); + //previous_dmadesc_b = &dmadesc_b[current_dmadescriptor_offset]; + } + + current_dmadescriptor_offset++; + + // If the number of pixels per row is too great for the size of a DMA payload, so we need to split what we were going to send above. + if ( dma_buff.rowBits[0]->size() > DMA_MAX ) + { + + for (int cd = 1; cd < PIXEL_COLOR_DEPTH_BITS; cd++) + { + dma_bus.create_dma_desc_link(dma_buff.rowBits[row]->getDataPtr(cd, 0), dma_buff.rowBits[row]->size(num_dma_payload_color_depths)); + + if (m_cfg.double_buff) { + dma_bus.create_dma_desc_link(dma_buff.rowBits[row]->getDataPtr(cd, 0), dma_buff.rowBits[row]->size(num_dma_payload_color_depths),true); + //link_dma_desc(&dmadesc_b[current_dmadescriptor_offset], previous_dmadesc_b, dma_buff.rowBits[row]->getDataPtr(cd, 1), dma_buff.rowBits[row]->size(num_dma_payload_color_depths)); + //previous_dmadesc_b = &dmadesc_b[current_dmadescriptor_offset]; + } + + current_dmadescriptor_offset++; + + } // additional linked list items + } // row depth struct + + + for(int i=lsbMsbTransitionBit + 1; i<PIXEL_COLOR_DEPTH_BITS; i++) + { + // binary time division setup: we need 2 of bit (LSBMSB_TRANSITION_BIT + 1) four of (LSBMSB_TRANSITION_BIT + 2), etc + // because we sweep through to MSB each time, it divides the number of times we have to sweep in half (saving linked list RAM) + // we need 2^(i - LSBMSB_TRANSITION_BIT - 1) == 1 << (i - LSBMSB_TRANSITION_BIT - 1) passes from i to MSB + + + for(int k=0; k < (1<<(i - lsbMsbTransitionBit - 1)); k++) + { + // link_dma_desc(&dmadesc_a[current_dmadescriptor_offset], previous_dmadesc_a, dma_buff.rowBits[row]->getDataPtr(i, 0), dma_buff.rowBits[row]->size(PIXEL_COLOR_DEPTH_BITS - i) ); +// previous_dmadesc_a = &dmadesc_a[current_dmadescriptor_offset]; + + dma_bus.create_dma_desc_link(dma_buff.rowBits[row]->getDataPtr(i, 0), dma_buff.rowBits[row]->size(PIXEL_COLOR_DEPTH_BITS - i) ); + + if (m_cfg.double_buff) { + dma_bus.create_dma_desc_link(dma_buff.rowBits[row]->getDataPtr(i, 0), dma_buff.rowBits[row]->size(PIXEL_COLOR_DEPTH_BITS - i), true ); + //link_dma_desc(&dmadesc_b[current_dmadescriptor_offset], previous_dmadesc_b, dma_buff.rowBits[row]->getDataPtr(i, 1), dma_buff.rowBits[row]->size(PIXEL_COLOR_DEPTH_BITS - i) ); + //previous_dmadesc_b = &dmadesc_b[current_dmadescriptor_offset]; + } + + current_dmadescriptor_offset++; + + } // end color depth ^ 2 linked list + } // end color depth loop + + } // end frame rows +/* + #if SERIAL_DEBUG + Serial.printf_P(PSTR("configureDMA(): Configured LL structure. %d DMA Linked List descriptors populated.\r\n"), current_dmadescriptor_offset); + + if ( desccount != current_dmadescriptor_offset) + { + Serial.printf_P(PSTR("configureDMA(): ERROR! Expected descriptor count of %d != actual DMA descriptors of %d!\r\n"), desccount, current_dmadescriptor_offset); + } + #endif + + //End markers for DMA LL + dmadesc_a[desccount-1].eof = 1; + dmadesc_a[desccount-1].qe.stqe_next=(lldesc_t*)&dmadesc_a[0]; + + if (m_cfg.double_buff) { + dmadesc_b[desccount-1].eof = 1; + dmadesc_b[desccount-1].qe.stqe_next=(lldesc_t*)&dmadesc_b[0]; + } else { + dmadesc_b = dmadesc_a; // link to same 'a' buffer + } + +#if SERIAL_DEBUG + Serial.println(F("Performing I2S setup:")); +#endif + + i2s_parallel_config_t dma_cfg = { + .gpio_bus={_cfg.gpio.r1, _cfg.gpio.g1, _cfg.gpio.b1, _cfg.gpio.r2, _cfg.gpio.g2, _cfg.gpio.b2, _cfg.gpio.lat, _cfg.gpio.oe, _cfg.gpio.a, _cfg.gpio.b, _cfg.gpio.c, _cfg.gpio.d, _cfg.gpio.e, -1, -1, -1}, + .gpio_clk=_cfg.gpio.clk, + .sample_rate=_cfg.i2sspeed, + .sample_width=ESP32_I2S_DMA_MODE, + .desccount_a=desccount, + .lldesc_a=dmadesc_a, + .desccount_b=desccount, + .lldesc_b=dmadesc_b, + .clkphase=_cfg.clkphase, + .int_ena_out_eof=_cfg.double_buff + }; + + // Setup I2S + //i2s_parallel_driver_install(ESP32_I2S_DEVICE, &dma_cfg); + +*/ + +// +// Setup DMA and Output to GPIO +// + auto bus_cfg = dma_bus.config(); // バス設定用の構造体を取得します。 + + //bus_cfg.i2s_port = I2S_NUM_0; // 使用するI2Sポートを選択 (I2S_NUM_0 or I2S_NUM_1) (ESP32のI2S LCDモードを使用します) + bus_cfg.bus_freq = _cfg.i2sspeed; + bus_cfg.pin_wr = m_cfg.gpio.clk; // WR を接続しているピン番号 + + bus_cfg.pin_d0 = m_cfg.gpio.r1; + bus_cfg.pin_d1 = m_cfg.gpio.g1; + bus_cfg.pin_d2 = m_cfg.gpio.b1; + bus_cfg.pin_d3 = m_cfg.gpio.r2; + bus_cfg.pin_d4 = m_cfg.gpio.g2; + bus_cfg.pin_d5 = m_cfg.gpio.b2; + bus_cfg.pin_d6 = m_cfg.gpio.lat; + bus_cfg.pin_d7 = m_cfg.gpio.oe; + bus_cfg.pin_d8 = m_cfg.gpio.a; + bus_cfg.pin_d9 = m_cfg.gpio.b; + bus_cfg.pin_d10 = m_cfg.gpio.c; + bus_cfg.pin_d11 = m_cfg.gpio.d; + bus_cfg.pin_d12 = m_cfg.gpio.e; + bus_cfg.pin_d13 = -1; + bus_cfg.pin_d14 = -1; + bus_cfg.pin_d15 = -1; + + dma_bus.config(bus_cfg); + + dma_bus.init(); + + dma_bus.dma_transfer_start(); + + + //i2s_parallel_send_dma(ESP32_I2S_DEVICE, &dmadesc_a[0]); + ESP_LOGI(TAG, "DMA setup completed"); + +} // end initMatrixDMABuff + + +/* There are 'bits' set in the frameStruct that we simply don't need to set every single time we change a pixel / DMA buffer co-ordinate. + * For example, the bits that determine the address lines, we don't need to set these every time. Once they're in place, and assuming we + * don't accidentally clear them, then we don't need to set them again. + * So to save processing, we strip this logic out to the absolute bare minimum, which is toggling only the R,G,B pixels (bits) per co-ord. + * + * Critical dependency: That 'updateMatrixDMABuffer(uint8_t red, uint8_t green, uint8_t blue)' has been run at least once over the + * entire frameBuffer to ensure all the non R,G,B bitmasks are in place (i.e. like OE, Address Lines etc.) + * + * Note: If you change the brightness with setBrightness() you MUST then clearScreen() and repaint / flush the entire framebuffer. + */ + +/** @brief - Update pixel at specific co-ordinate in the DMA buffer + * this is the main method used to update DMA buffer on pixel-by-pixel level so it must be fast, real fast! + * Let's put it into IRAM to avoid situations when it could be flushed out of instruction cache + * and had to be read from spi-flash over and over again. + * Yes, it is always a tradeoff between memory/speed/size, but compared to DMA-buffer size is not a big deal + */ +void IRAM_ATTR MatrixPanel_I2S_DMA::updateMatrixDMABuffer(int16_t x_coord, int16_t y_coord, uint8_t red, uint8_t green, uint8_t blue) +{ + if ( !initialized ) { + #if SERIAL_DEBUG + Serial.println(F("Cannot updateMatrixDMABuffer as setup failed!")); + #endif + return; + } + + /* 1) Check that the co-ordinates are within range, or it'll break everything big time. + * Valid co-ordinates are from 0 to (MATRIX_XXXX-1) + */ + if ( x_coord < 0 || y_coord < 0 || x_coord >= PIXELS_PER_ROW || y_coord >= m_cfg.mx_height) { + return; + } + + /* LED Brightness Compensation. Because if we do a basic "red & mask" for example, + * we'll NEVER send the dimmest possible colour, due to binary skew. + * i.e. It's almost impossible for color_depth_idx of 0 to be sent out to the MATRIX unless the 'value' of a color is exactly '1' + * https://ledshield.wordpress.com/2012/11/13/led-brightness-to-your-eye-gamma-correction-no/ + */ +#ifndef NO_CIE1931 + red = lumConvTab[red]; + green = lumConvTab[green]; + blue = lumConvTab[blue]; +#endif + + /* When using the drawPixel, we are obviously only changing the value of one x,y position, + * however, the two-scan panels paint TWO lines at the same time + * and this reflects the parallel in-DMA-memory data structure of uint16_t's that are getting + * pumped out at high speed. + * + * So we need to ensure we persist the bits (8 of them) of the uint16_t for the row we aren't changing. + * + * The DMA buffer order has also been reversed (refer to the last code in this function) + * so we have to check for this and check the correct position of the MATRIX_DATA_STORAGE_TYPE + * data. + */ + +#if defined (ESP32_THE_ORIG) + // We need to update the correct uint16_t in the rowBitStruct array, that gets sent out in parallel + // 16 bit parallel mode - Save the calculated value to the bitplane memory in reverse order to account for I2S Tx FIFO mode1 ordering + // Irrelevant for ESP32-S2 the way the FIFO ordering works is different - refer to page 679 of S2 technical reference manual + x_coord & 1U ? --x_coord : ++x_coord; +#endif + + + uint16_t _colorbitclear = BITMASK_RGB1_CLEAR, _colorbitoffset = 0; + + if (y_coord >= ROWS_PER_FRAME){ // if we are drawing to the bottom part of the panel + _colorbitoffset = BITS_RGB2_OFFSET; + _colorbitclear = BITMASK_RGB2_CLEAR; + y_coord -= ROWS_PER_FRAME; + } + + // Iterating through colour depth bits, which we assume are 8 bits per RGB subpixel (24bpp) + uint8_t color_depth_idx = PIXEL_COLOR_DEPTH_BITS; + do { + --color_depth_idx; +// uint8_t mask = (1 << (color_depth_idx COLOR_DEPTH_LESS_THAN_8BIT_ADJUST)); // expect 24 bit color (8 bits per RGB subpixel) + #if PIXEL_COLOR_DEPTH_BITS < 8 + uint8_t mask = (1 << (color_depth_idx+MASK_OFFSET)); // expect 24 bit color (8 bits per RGB subpixel) + #else + uint8_t mask = (1 << (color_depth_idx)); // expect 24 bit color (8 bits per RGB subpixel) + #endif + uint16_t RGB_output_bits = 0; + + /* Per the .h file, the order of the output RGB bits is: + * BIT_B2, BIT_G2, BIT_R2, BIT_B1, BIT_G1, BIT_R1 */ + RGB_output_bits |= (bool)(blue & mask); // --B + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(green & mask); // -BG + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(red & mask); // BGR + RGB_output_bits <<= _colorbitoffset; // shift color bits to the required position + + + // Get the contents at this address, + // it would represent a vector pointing to the full row of pixels for the specified color depth bit at Y coordinate + //ESP32_I2S_DMA_STORAGE_TYPE *p = getRowDataPtr(y_coord, color_depth_idx, back_buffer_id); + ESP32_I2S_DMA_STORAGE_TYPE *p = dma_buff.rowBits[y_coord]->getDataPtr(color_depth_idx, back_buffer_id); + + + // We need to update the correct uint16_t word in the rowBitStruct array pointing to a specific pixel at X - coordinate + p[x_coord] &= _colorbitclear; // reset RGB bits + p[x_coord] |= RGB_output_bits; // set new RGB bits + + } while(color_depth_idx); // end of color depth loop (8) +} // updateMatrixDMABuffer (specific co-ords change) + + +/* Update the entire buffer with a single specific colour - quicker */ +void MatrixPanel_I2S_DMA::updateMatrixDMABuffer(uint8_t red, uint8_t green, uint8_t blue) +{ + if ( !initialized ) return; + + /* https://ledshield.wordpress.com/2012/11/13/led-brightness-to-your-eye-gamma-correction-no/ */ +#ifndef NO_CIE1931 + red = lumConvTab[red]; + green = lumConvTab[green]; + blue = lumConvTab[blue]; +#endif + + for(uint8_t color_depth_idx=0; color_depth_idx<PIXEL_COLOR_DEPTH_BITS; color_depth_idx++) // color depth - 8 iterations + { + // let's precalculate RGB1 and RGB2 bits than flood it over the entire DMA buffer + uint16_t RGB_output_bits = 0; +// uint8_t mask = (1 << color_depth_idx COLOR_DEPTH_LESS_THAN_8BIT_ADJUST); // 24 bit color + #if PIXEL_COLOR_DEPTH_BITS < 8 + uint8_t mask = (1 << (color_depth_idx+MASK_OFFSET)); // expect 24 bit color (8 bits per RGB subpixel) + #else + uint8_t mask = (1 << (color_depth_idx)); // expect 24 bit color (8 bits per RGB subpixel) + #endif + + /* Per the .h file, the order of the output RGB bits is: + * BIT_B2, BIT_G2, BIT_R2, BIT_B1, BIT_G1, BIT_R1 */ + RGB_output_bits |= (bool)(blue & mask); // --B + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(green & mask); // -BG + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(red & mask); // BGR + + // Duplicate and shift across so we have have 6 populated bits of RGB1 and RGB2 pin values suitable for DMA buffer + RGB_output_bits |= RGB_output_bits << BITS_RGB2_OFFSET; //BGRBGR + + //Serial.printf("Fill with: 0x%#06x\n", RGB_output_bits); + + // iterate rows + int matrix_frame_parallel_row = dma_buff.rowBits.size(); + do { + --matrix_frame_parallel_row; + + // The destination for the pixel row bitstream + //ESP32_I2S_DMA_STORAGE_TYPE *p = getRowDataPtr(matrix_frame_parallel_row, color_depth_idx, back_buffer_id); + ESP32_I2S_DMA_STORAGE_TYPE *p = dma_buff.rowBits[matrix_frame_parallel_row]->getDataPtr(color_depth_idx, back_buffer_id); + + // iterate pixels in a row + int x_coord=dma_buff.rowBits[matrix_frame_parallel_row]->width; + do { + --x_coord; + p[x_coord] &= BITMASK_RGB12_CLEAR; // reset color bits + p[x_coord] |= RGB_output_bits; // set new color bits + } while(x_coord); + + } while(matrix_frame_parallel_row); // end row iteration + } // colour depth loop (8) +} // updateMatrixDMABuffer (full frame paint) + +/** + * @brief - clears and reinitializes color/control data in DMA buffs + * When allocated, DMA buffs might be dirty, so we need to blank it and initialize ABCDE,LAT,OE control bits. + * Those control bits are constants during the entire DMA sweep and never changed when updating just pixel color data + * so we could set it once on DMA buffs initialization and forget. + * This effectively clears buffers to blank BLACK and makes it ready to display output. + * (Brightness control via OE bit manipulation is another case) + */ +void MatrixPanel_I2S_DMA::clearFrameBuffer(bool _buff_id){ + if (!initialized) + return; + + // we start with iterating all rows in dma_buff structure + int row_idx = dma_buff.rowBits.size(); + do { + --row_idx; + + ESP32_I2S_DMA_STORAGE_TYPE* row = dma_buff.rowBits[row_idx]->getDataPtr(0, _buff_id); // set pointer to the HEAD of a buffer holding data for the entire matrix row + + ESP32_I2S_DMA_STORAGE_TYPE abcde = (ESP32_I2S_DMA_STORAGE_TYPE)row_idx; + abcde <<= BITS_ADDR_OFFSET; // shift row y-coord to match ABCDE bits in vector from 8 to 12 + + // get last pixel index in a row of all colordepths + int x_pixel = dma_buff.rowBits[row_idx]->width * dma_buff.rowBits[row_idx]->color_depth; + //Serial.printf(" from pixel %d, ", x_pixel); + + // fill all x_pixels except color_index[0] (LSB) ones, this also clears all color data to 0's black + do { + --x_pixel; + + if ( m_cfg.driver == HUB75_I2S_CFG::SM5266P) { + // modifications here for row shift register type SM5266P + // https://github.com/mrfaptastic/ESP32-HUB75-MatrixPanel-I2S-DMA/issues/164 + row[x_pixel] = abcde & (0x18 << BITS_ADDR_OFFSET); // mask out the bottom 3 bits which are the clk di bk inputs + } else { + row[x_pixel] = abcde; + } + + } while(x_pixel!=dma_buff.rowBits[row_idx]->width); + + // color_index[0] (LSB) x_pixels must be "marked" with a previous's row address, 'cause it is used to display + // previous row while we pump in LSB's for a new row + abcde = ((ESP32_I2S_DMA_STORAGE_TYPE)row_idx-1) << BITS_ADDR_OFFSET; + do { + --x_pixel; + + if ( m_cfg.driver == HUB75_I2S_CFG::SM5266P) { + // modifications here for row shift register type SM5266P + // https://github.com/mrfaptastic/ESP32-HUB75-MatrixPanel-I2S-DMA/issues/164 + row[x_pixel] = abcde & (0x18 << BITS_ADDR_OFFSET); // mask out the bottom 3 bits which are the clk di bk inputs + } else { + row[x_pixel] = abcde; + } + //row[x_pixel] = abcde; + } while(x_pixel); + + + // modifications here for row shift register type SM5266P + // https://github.com/mrfaptastic/ESP32-HUB75-MatrixPanel-I2S-DMA/issues/164 + if ( m_cfg.driver == HUB75_I2S_CFG::SM5266P) { + uint16_t serialCount; + uint16_t latch; + x_pixel = dma_buff.rowBits[row_idx]->width - 16; // come back 8*2 pixels to allow for 8 writes + serialCount = 8; + do{ + serialCount--; + latch = row[x_pixel] | (((((ESP32_I2S_DMA_STORAGE_TYPE)row_idx) % 8) == serialCount) << 1) << BITS_ADDR_OFFSET; // data on 'B' + row[x_pixel++] = latch| (0x05<< BITS_ADDR_OFFSET); // clock high on 'A'and BK high for update + row[x_pixel++] = latch| (0x04<< BITS_ADDR_OFFSET); // clock low on 'A'and BK high for update + } while (serialCount); + } // end SM5266P + + + // let's set LAT/OE control bits for specific pixels in each color_index subrows + // Need to consider the original ESP32's (WROOM) DMA TX FIFO reordering of bytes... + uint8_t coloridx = dma_buff.rowBits[row_idx]->color_depth; + do { + --coloridx; + + // switch pointer to a row for a specific color index + row = dma_buff.rowBits[row_idx]->getDataPtr(coloridx, _buff_id); + + #if defined(ESP32_THE_ORIG) + // We need to update the correct uint16_t in the rowBitStruct array, that gets sent out in parallel + // 16 bit parallel mode - Save the calculated value to the bitplane memory in reverse order to account for I2S Tx FIFO mode1 ordering + // Irrelevant for ESP32-S2 the way the FIFO ordering works is different - refer to page 679 of S2 technical reference manual + row[dma_buff.rowBits[row_idx]->width - 2] |= BIT_LAT; // -2 in the DMA array is actually -1 when it's reordered by TX FIFO + #else + // -1 works better on ESP32-S2 ? Because bytes get sent out in order... + row[dma_buff.rowBits[row_idx]->width - 1] |= BIT_LAT; // -1 pixel to compensate array index starting at 0 + #endif + + // need to disable OE before/after latch to hide row transition + // Should be one clock or more before latch, otherwise can get ghosting + uint8_t _blank = m_cfg.latch_blanking; + do { + --_blank; + + #if defined(ESP32_THE_ORIG) + // Original ESP32 WROOM FIFO Ordering Sucks + uint8_t _blank_row_tx_fifo_tmp = 0 + _blank; + (_blank_row_tx_fifo_tmp & 1U) ? --_blank_row_tx_fifo_tmp : ++_blank_row_tx_fifo_tmp; + row[_blank_row_tx_fifo_tmp] |= BIT_OE; + + _blank_row_tx_fifo_tmp = dma_buff.rowBits[row_idx]->width - _blank - 1; // (LAT pulse is (width-2) -1 pixel to compensate array index starting at 0 + (_blank_row_tx_fifo_tmp & 1U) ? --_blank_row_tx_fifo_tmp : ++_blank_row_tx_fifo_tmp; + row[_blank_row_tx_fifo_tmp] |= BIT_OE; + #else + row[0 + _blank] |= BIT_OE; + row[dma_buff.rowBits[row_idx]->width - _blank - 1 ] |= BIT_OE; // (LAT pulse is (width-2) -1 pixel to compensate array index starting at 0 + #endif + + } while (_blank); + + } while(coloridx); + + } while(row_idx); +} + +/** + * @brief - reset OE bits in DMA buffer in a way to control brightness + * @param brt - brightness level from 0 to row_width + * @param _buff_id - buffer id to control + */ +void MatrixPanel_I2S_DMA::brtCtrlOE(int brt, const bool _buff_id){ + if (!initialized) + return; + + if (brt > PIXELS_PER_ROW - (MAX_LAT_BLANKING + 2)) // can't control values larger than (row_width - latch_blanking) to avoid ongoing issues being raised about brightness and ghosting. + brt = PIXELS_PER_ROW - (MAX_LAT_BLANKING + 2); // +2 for a bit of buffer... + + if (brt < 0) + brt = 0; + + // start with iterating all rows in dma_buff structure + int row_idx = dma_buff.rowBits.size(); + do { + --row_idx; + + // let's set OE control bits for specific pixels in each color_index subrows + uint8_t coloridx = dma_buff.rowBits[row_idx]->color_depth; + do { + --coloridx; + + // switch pointer to a row for a specific color index + ESP32_I2S_DMA_STORAGE_TYPE* row = dma_buff.rowBits[row_idx]->getDataPtr(coloridx, _buff_id); + + int x_coord = dma_buff.rowBits[row_idx]->width; + do { + --x_coord; + + // clear OE bit for all other pixels + row[x_coord] &= BITMASK_OE_CLEAR; + + // Brightness control via OE toggle - disable matrix output at specified x_coord + if((coloridx > lsbMsbTransitionBit || !coloridx) && ((x_coord) >= brt)){ + row[x_coord] |= BIT_OE; // Disable output after this point. + continue; + } + // special case for the bits *after* LSB through (lsbMsbTransitionBit) - OE is output after data is shifted, so need to set OE to fractional brightness + if(coloridx && coloridx <= lsbMsbTransitionBit) { + // divide brightness in half for each bit below lsbMsbTransitionBit + int lsbBrightness = brt >> (lsbMsbTransitionBit - coloridx + 1); + if((x_coord) >= lsbBrightness) { + row[x_coord] |= BIT_OE; // Disable output after this point. + continue; + } + } + + + } while(x_coord); + + // need to disable OE before/after latch to hide row transition + // Should be one clock or more before latch, otherwise can get ghosting + uint8_t _blank = m_cfg.latch_blanking; + do { + --_blank; + + #if defined(ESP32_THE_ORIG) + // Original ESP32 WROOM FIFO Ordering Sucks + uint8_t _blank_row_tx_fifo_tmp = 0 + _blank; + (_blank_row_tx_fifo_tmp & 1U) ? --_blank_row_tx_fifo_tmp : ++_blank_row_tx_fifo_tmp; + row[_blank_row_tx_fifo_tmp] |= BIT_OE; + #else + row[0 + _blank] |= BIT_OE; + #endif + + //row[0 + _blank] |= BIT_OE; + // no need, has been done already + //row[dma_buff.rowBits[row_idx]->width - _blank - 3 ] |= BIT_OE; // (LAT pulse is (width-2) -1 pixel to compensate array index starting at 0 + } while (_blank); + + } while(coloridx); + } while(row_idx); +} + + +/* + * overload for compatibility + */ + +bool MatrixPanel_I2S_DMA::begin(int r1, int g1, int b1, int r2, int g2, int b2, int a, int b, int c, int d, int e, int lat, int oe, int clk) { + + // RGB + m_cfg.gpio.r1 = r1; m_cfg.gpio.g1 = g1; m_cfg.gpio.b1 = b1; + m_cfg.gpio.r2 = r2; m_cfg.gpio.g2 = g2; m_cfg.gpio.b2 = b2; + + // Line Select + m_cfg.gpio.a = a; m_cfg.gpio.b = b; m_cfg.gpio.c = c; + m_cfg.gpio.d = d; m_cfg.gpio.e = e; + + // Clock & Control + m_cfg.gpio.lat = lat; m_cfg.gpio.oe = oe; m_cfg.gpio.clk = clk; + + return begin(); +} + + +/** + * @brief - Sets how many clock cycles to blank OE before/after LAT signal change + * @param uint8_t pulses - clocks before/after OE + * default is DEFAULT_LAT_BLANKING + * Max is MAX_LAT_BLANKING + * @returns - new value for m_cfg.latch_blanking + */ +uint8_t MatrixPanel_I2S_DMA::setLatBlanking(uint8_t pulses){ + if (pulses > MAX_LAT_BLANKING) + pulses = MAX_LAT_BLANKING; + + if (!pulses) + pulses = DEFAULT_LAT_BLANKING; + + m_cfg.latch_blanking = pulses; + setPanelBrightness(brightness); // set brightness to reset OE bits to the values matching new LAT blanking setting + return m_cfg.latch_blanking; +} + + +#ifndef NO_FAST_FUNCTIONS +/** + * @brief - update DMA buff drawing horizontal line at specified coordinates + * @param x_ccord - line start coordinate x + * @param y_ccord - line start coordinate y + * @param l - line length + * @param r,g,b, - RGB888 color + */ +void MatrixPanel_I2S_DMA::hlineDMA(int16_t x_coord, int16_t y_coord, int16_t l, uint8_t red, uint8_t green, uint8_t blue){ + if ( !initialized ) + return; + + if ( x_coord < 0 || y_coord < 0 || l < 1 || x_coord >= PIXELS_PER_ROW || y_coord >= m_cfg.mx_height) + return; + + + l = ( (x_coord + l) >= PIXELS_PER_ROW ) ? (PIXELS_PER_ROW - x_coord):l; + + //if (x_coord+l > PIXELS_PER_ROW) +// l = PIXELS_PER_ROW - x_coord + 1; // reset width to end of row + + /* LED Brightness Compensation */ +#ifndef NO_CIE1931 + red = lumConvTab[red]; + green = lumConvTab[green]; + blue = lumConvTab[blue]; +#endif + + uint16_t _colorbitclear = BITMASK_RGB1_CLEAR, _colorbitoffset = 0; + + if (y_coord >= ROWS_PER_FRAME){ // if we are drawing to the bottom part of the panel + _colorbitoffset = BITS_RGB2_OFFSET; + _colorbitclear = BITMASK_RGB2_CLEAR; + y_coord -= ROWS_PER_FRAME; + } + + // Iterating through color depth bits (8 iterations) + uint8_t color_depth_idx = PIXEL_COLOR_DEPTH_BITS; + do { + --color_depth_idx; + + // let's precalculate RGB1 and RGB2 bits than flood it over the entire DMA buffer + uint16_t RGB_output_bits = 0; +// uint8_t mask = (1 << color_depth_idx COLOR_DEPTH_LESS_THAN_8BIT_ADJUST); + #if PIXEL_COLOR_DEPTH_BITS < 8 + uint8_t mask = (1 << (color_depth_idx+MASK_OFFSET)); // expect 24 bit color (8 bits per RGB subpixel) + #else + uint8_t mask = (1 << (color_depth_idx)); // expect 24 bit color (8 bits per RGB subpixel) + #endif + + /* Per the .h file, the order of the output RGB bits is: + * BIT_B2, BIT_G2, BIT_R2, BIT_B1, BIT_G1, BIT_R1 */ + RGB_output_bits |= (bool)(blue & mask); // --B + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(green & mask); // -BG + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(red & mask); // BGR + RGB_output_bits <<= _colorbitoffset; // shift color bits to the required position + + // Get the contents at this address, + // it would represent a vector pointing to the full row of pixels for the specified color depth bit at Y coordinate + ESP32_I2S_DMA_STORAGE_TYPE *p = dma_buff.rowBits[y_coord]->getDataPtr(color_depth_idx, back_buffer_id); + // inlined version works slower here, dunno why :( + // ESP32_I2S_DMA_STORAGE_TYPE *p = getRowDataPtr(y_coord, color_depth_idx, back_buffer_id); + + int16_t _l = l; + do { // iterate pixels in a row + int16_t _x = x_coord + --_l; + +#if defined(ESP32_THE_ORIG) + // Save the calculated value to the bitplane memory in reverse order to account for I2S Tx FIFO mode1 ordering + uint16_t &v = p[_x & 1U ? --_x : ++_x]; +#else + // ESP 32 doesn't need byte flipping for TX FIFO. + uint16_t &v = p[_x]; +#endif + + v &= _colorbitclear; // reset color bits + v |= RGB_output_bits; // set new color bits + } while(_l); // iterate pixels in a row + } while(color_depth_idx); // end of color depth loop (8) +} // hlineDMA() + + +/** + * @brief - update DMA buff drawing vertical line at specified coordinates + * @param x_ccord - line start coordinate x + * @param y_ccord - line start coordinate y + * @param l - line length + * @param r,g,b, - RGB888 color + */ +void MatrixPanel_I2S_DMA::vlineDMA(int16_t x_coord, int16_t y_coord, int16_t l, uint8_t red, uint8_t green, uint8_t blue){ + if ( !initialized ) + return; + + if ( x_coord < 0 || y_coord < 0 || l < 1 || x_coord >= PIXELS_PER_ROW || y_coord >= m_cfg.mx_height) + return; + + // check for a length that goes beyond the height of the screen! Array out of bounds dma memory changes = screwed output #163 + l = ( (y_coord + l) >= m_cfg.mx_height ) ? (m_cfg.mx_height - y_coord):l; + //if (y_coord + l > m_cfg.mx_height) + /// l = m_cfg.mx_height - y_coord + 1; // reset width to end of col + + /* LED Brightness Compensation */ +#ifndef NO_CIE1931 + red = lumConvTab[red]; + green = lumConvTab[green]; + blue = lumConvTab[blue]; +#endif + +#if defined(ESP32_THE_ORIG) + // Save the calculated value to the bitplane memory in reverse order to account for I2S Tx FIFO mode1 ordering + x_coord & 1U ? --x_coord : ++x_coord; +#endif + + uint8_t color_depth_idx = PIXEL_COLOR_DEPTH_BITS; + do { // Iterating through color depth bits (8 iterations) + --color_depth_idx; + + // let's precalculate RGB1 and RGB2 bits than flood it over the entire DMA buffer +// uint8_t mask = (1 << color_depth_idx COLOR_DEPTH_LESS_THAN_8BIT_ADJUST); + #if PIXEL_COLOR_DEPTH_BITS < 8 + uint8_t mask = (1 << (color_depth_idx+MASK_OFFSET)); // expect 24 bit color (8 bits per RGB subpixel) + #else + uint8_t mask = (1 << (color_depth_idx)); // expect 24 bit color (8 bits per RGB subpixel) + #endif + uint16_t RGB_output_bits = 0; + + /* Per the .h file, the order of the output RGB bits is: + * BIT_B2, BIT_G2, BIT_R2, BIT_B1, BIT_G1, BIT_R1 */ + RGB_output_bits |= (bool)(blue & mask); // --B + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(green & mask); // -BG + RGB_output_bits <<= 1; + RGB_output_bits |= (bool)(red & mask); // BGR + + int16_t _l = 0, _y = y_coord; + uint16_t _colorbitclear = BITMASK_RGB1_CLEAR; + do { // iterate pixels in a column + + if (_y >= ROWS_PER_FRAME){ // if y-coord overlapped bottom-half panel + _y -= ROWS_PER_FRAME; + _colorbitclear = BITMASK_RGB2_CLEAR; + RGB_output_bits <<= BITS_RGB2_OFFSET; + } + + // Get the contents at this address, + // it would represent a vector pointing to the full row of pixels for the specified color depth bit at Y coordinate + //ESP32_I2S_DMA_STORAGE_TYPE *p = getRowDataPtr(_y, color_depth_idx, back_buffer_id); + ESP32_I2S_DMA_STORAGE_TYPE *p = dma_buff.rowBits[_y]->getDataPtr(color_depth_idx, back_buffer_id); + + p[x_coord] &= _colorbitclear; // reset RGB bits + p[x_coord] |= RGB_output_bits; // set new RGB bits + ++_y; + } while(++_l!=l); // iterate pixels in a col + } while(color_depth_idx); // end of color depth loop (8) +} // vlineDMA() + + +/** + * @brief - update DMA buff drawing a rectangular at specified coordinates + * this works much faster than multiple consecutive per-pixel calls to updateMatrixDMABuffer() + * @param int16_t x, int16_t y - coordinates of a top-left corner + * @param int16_t w, int16_t h - width and height of a rectangular, min is 1 px + * @param uint8_t r - RGB888 color + * @param uint8_t g - RGB888 color + * @param uint8_t b - RGB888 color + */ +void MatrixPanel_I2S_DMA::fillRectDMA(int16_t x, int16_t y, int16_t w, int16_t h, uint8_t r, uint8_t g, uint8_t b){ + + // h-lines are >2 times faster than v-lines + // so will use it only for tall rects with h >2w + if (h>2*w){ + // draw using v-lines + do { + --w; + vlineDMA(x+w, y, h, r,g,b); + } while(w); + } else { + // draw using h-lines + do { + --h; + hlineDMA(x, y+h, w, r,g,b); + } while(h); + } +} + +#endif // NO_FAST_FUNCTIONS |
