1 // Copyright (C) 2013 Michael McMaster <michael@codesrc.com>
\r
3 // This file is part of SCSI2SD.
\r
5 // SCSI2SD is free software: you can redistribute it and/or modify
\r
6 // it under the terms of the GNU General Public License as published by
\r
7 // the Free Software Foundation, either version 3 of the License, or
\r
8 // (at your option) any later version.
\r
10 // SCSI2SD is distributed in the hope that it will be useful,
\r
11 // but WITHOUT ANY WARRANTY; without even the implied warranty of
\r
12 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
\r
13 // GNU General Public License for more details.
\r
15 // You should have received a copy of the GNU General Public License
\r
16 // along with SCSI2SD. If not, see <http://www.gnu.org/licenses/>.
\r
18 #include "stm32f2xx.h"
\r
19 #include "stm32f2xx_hal.h"
\r
20 #include "stm32f2xx_hal_dma.h"
\r
23 #include "scsiPhy.h"
\r
32 // Assumes a 96MHz fpga clock.
\r
33 // 2:0 Deskew count, 55ns
\r
34 // 6:4 Hold count, 53ns
\r
35 // 3:0 Assertion count, 80ns
\r
36 #define SCSI_DEFAULT_DESKEW 0x6
\r
37 #define SCSI_DEFAULT_TIMING ((0x5 << 4) | 0x8)
\r
40 // 2:0 Deskew count, 25ns
\r
41 // 6:4 Hold count, 33ns
\r
42 // 3:0 Assertion count, 30ns
\r
43 #define SCSI_FAST10_DESKEW 3
\r
44 #define SCSI_FAST10_TIMING ((0x3 << 4) | 0x3)
\r
47 // 2:0 Deskew count, 12ns
\r
48 // 6:4 Hold count, 17ns
\r
49 // 3:0 Assertion count, 15ns
\r
50 #define SCSI_FAST20_DESKEW 2
\r
51 #define SCSI_FAST20_TIMING ((0x2 << 4) | 0x2)
\r
53 // Private DMA variables.
\r
54 static int dmaInProgress = 0;
\r
56 static DMA_HandleTypeDef memToFSMC;
\r
57 static DMA_HandleTypeDef fsmcToMem;
\r
60 volatile uint8_t scsiRxDMAComplete;
\r
61 volatile uint8_t scsiTxDMAComplete;
\r
64 CY_ISR_PROTO(scsiRxCompleteISR);
\r
65 CY_ISR(scsiRxCompleteISR)
\r
67 traceIrq(trace_scsiRxCompleteISR);
\r
68 scsiRxDMAComplete = 1;
\r
71 CY_ISR_PROTO(scsiTxCompleteISR);
\r
72 CY_ISR(scsiTxCompleteISR)
\r
74 traceIrq(trace_scsiTxCompleteISR);
\r
75 scsiTxDMAComplete = 1;
\r
79 uint8_t scsiPhyFifoSel = 0; // global
\r
81 // scsi IRQ handler is initialised by the STM32 HAL. Connected to
\r
83 // Note: naming is important to ensure this function is listed in the
\r
85 void EXTI4_IRQHandler()
\r
87 traceIrq(trace_scsiResetISR);
\r
89 // Make sure that interrupt flag is set
\r
90 if (__HAL_GPIO_EXTI_GET_IT(GPIO_PIN_4) != RESET) {
\r
92 // Clear interrupt flag
\r
93 __HAL_GPIO_EXTI_CLEAR_IT(GPIO_PIN_4);
\r
95 scsiDev.resetFlag = scsiDev.resetFlag || scsiStatusRST();
\r
96 // TODO grab SEL status as well
\r
101 static void assertFail()
\r
113 scsiSetDataCount(uint32_t count)
\r
115 *SCSI_DATA_CNT_HI = count >> 8;
\r
116 *SCSI_DATA_CNT_LO = count & 0xff;
\r
117 *SCSI_DATA_CNT_SET = 1;
\r
124 if (!scsiPhyFifoAltEmpty()) {
\r
125 // Force a lock-up.
\r
129 scsiSetDataCount(1);
\r
131 trace(trace_spinPhyRxFifo);
\r
132 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag)) {}
\r
134 uint8_t val = scsiPhyRx();
\r
135 // TODO scsiDev.parityError = scsiDev.parityError || SCSI_Parity_Error_Read();
\r
138 if (!scsiPhyFifoEmpty()) {
\r
140 uint8_t k __attribute((unused));
\r
141 while (!scsiPhyFifoEmpty()) { k = scsiPhyRx(); ++j; }
\r
143 // Force a lock-up.
\r
152 scsiReadPIO(uint8_t* data, uint32_t count)
\r
154 uint16_t* fifoData = (uint16_t*)data;
\r
155 for (int i = 0; i < (count + 1) / 2; ++i)
\r
157 fifoData[i] = scsiPhyRx(); // TODO ASSUMES LITTLE ENDIAN
\r
159 // TODO scsiDev.parityError = scsiDev.parityError || SCSI_Parity_Error_Read();
\r
163 scsiReadDMA(uint8_t* data, uint32_t count)
\r
165 // Prepare DMA transfer
\r
167 trace(trace_doRxSingleDMA);
\r
169 scsiTxDMAComplete = 1; // TODO not used much
\r
170 scsiRxDMAComplete = 0; // TODO not used much
\r
174 (uint32_t) SCSI_FIFO_DATA,
\r
182 int complete = __HAL_DMA_GET_COUNTER(&fsmcToMem) == 0;
\r
183 complete = complete && (HAL_DMA_PollForTransfer(&fsmcToMem, HAL_DMA_FULL_TRANSFER, 0xffffffff) == HAL_OK);
\r
186 scsiTxDMAComplete = 1; // TODO MM FIX IRQ
\r
187 scsiRxDMAComplete = 1;
\r
191 // TODO MM scsiDev.parityError = scsiDev.parityError || SCSI_Parity_Error_Read();
\r
203 scsiRead(uint8_t* data, uint32_t count)
\r
208 uint32_t chunk = ((count - i) > SCSI_FIFO_DEPTH)
\r
209 ? SCSI_FIFO_DEPTH : (count - i);
\r
210 #ifdef SCSI_FSMC_DMA
\r
213 // DMA is doing 32bit transfers.
\r
214 chunk = chunk & 0xFFFFFFF8;
\r
217 scsiSetDataCount(chunk);
\r
219 while (i < count && likely(!scsiDev.resetFlag))
\r
221 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag)) {}
\r
224 uint32_t nextChunk = ((count - i - chunk) > SCSI_FIFO_DEPTH)
\r
225 ? SCSI_FIFO_DEPTH : (count - i - chunk);
\r
226 #ifdef SCSI_FSMC_DMA
\r
227 if (nextChunk >= 16)
\r
229 nextChunk = nextChunk & 0xFFFFFFF8;
\r
234 scsiSetDataCount(nextChunk);
\r
237 #ifdef SCSI_FSMC_DMA
\r
241 scsiReadPIO(data + i, chunk);
\r
243 #ifdef SCSI_FSMC_DMA
\r
246 scsiReadDMA(data + i, chunk);
\r
248 trace(trace_spinReadDMAPoll);
\r
250 while (!scsiReadDMAPoll() && likely(!scsiDev.resetFlag))
\r
261 if (!scsiPhyFifoEmpty() || !scsiPhyFifoAltEmpty()) {
\r
263 while (!scsiPhyFifoEmpty()) { scsiPhyRx(); ++j; }
\r
266 while (!scsiPhyFifoEmpty()) { scsiPhyRx(); ++k; }
\r
267 // Force a lock-up.
\r
274 scsiWriteByte(uint8_t value)
\r
277 if (!scsiPhyFifoEmpty()) {
\r
278 // Force a lock-up.
\r
282 trace(trace_spinPhyTxFifo);
\r
286 scsiSetDataCount(1);
\r
288 trace(trace_spinTxComplete);
\r
289 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag)) {}
\r
292 if (!scsiPhyFifoAltEmpty()) {
\r
293 // Force a lock-up.
\r
300 scsiWritePIO(const uint8_t* data, uint32_t count)
\r
302 uint16_t* fifoData = (uint16_t*)data;
\r
303 for (int i = 0; i < (count + 1) / 2; ++i)
\r
305 scsiPhyTx(fifoData[i]);
\r
310 scsiWriteDMA(const uint8_t* data, uint32_t count)
\r
312 // Prepare DMA transfer
\r
314 trace(trace_doTxSingleDMA);
\r
316 scsiTxDMAComplete = 0;
\r
317 scsiRxDMAComplete = 1;
\r
322 (uint32_t) SCSI_FIFO_DATA,
\r
329 int complete = __HAL_DMA_GET_COUNTER(&memToFSMC) == 0;
\r
330 complete = complete && (HAL_DMA_PollForTransfer(&memToFSMC, HAL_DMA_FULL_TRANSFER, 0xffffffff) == HAL_OK);
\r
333 scsiTxDMAComplete = 1; // TODO MM FIX IRQ
\r
334 scsiRxDMAComplete = 1;
\r
346 scsiWrite(const uint8_t* data, uint32_t count)
\r
349 while (i < count && likely(!scsiDev.resetFlag))
\r
351 uint32_t chunk = ((count - i) > SCSI_FIFO_DEPTH)
\r
352 ? SCSI_FIFO_DEPTH : (count - i);
\r
355 if (!scsiPhyFifoEmpty()) {
\r
356 // Force a lock-up.
\r
361 #ifdef SCSI_FSMC_DMA
\r
365 scsiWritePIO(data + i, chunk);
\r
367 #ifdef SCSI_FSMC_DMA
\r
370 // DMA is doing 32bit transfers.
\r
371 chunk = chunk & 0xFFFFFFF8;
\r
372 scsiWriteDMA(data + i, chunk);
\r
374 trace(trace_spinReadDMAPoll);
\r
376 while (!scsiWriteDMAPoll() && likely(!scsiDev.resetFlag))
\r
382 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag))
\r
387 if (!scsiPhyFifoAltEmpty()) {
\r
388 // Force a lock-up.
\r
394 scsiSetDataCount(chunk);
\r
397 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag))
\r
402 if (!scsiPhyFifoAltEmpty()) {
\r
403 // Force a lock-up.
\r
409 static inline void busSettleDelay(void)
\r
411 // Data Release time (switching IO) = 400ns
\r
412 // + Bus Settle time (switching phase) = 400ns.
\r
413 s2s_delay_us(1); // Close enough.
\r
416 void scsiEnterBusFree()
\r
418 *SCSI_CTRL_BSY = 0x00;
\r
419 // We now have a Bus Clear Delay of 800ns to release remaining signals.
\r
420 *SCSI_CTRL_PHASE = 0;
\r
423 void scsiEnterPhase(int phase)
\r
425 // ANSI INCITS 362-2002 SPI-3 10.7.1:
\r
426 // Phase changes are not allowed while REQ or ACK is asserted.
\r
427 while (likely(!scsiDev.resetFlag) && scsiStatusACK()) {}
\r
429 int newPhase = phase > 0 ? phase : 0;
\r
430 int oldPhase = *SCSI_CTRL_PHASE;
\r
432 if (!scsiDev.resetFlag && (!scsiPhyFifoEmpty() || !scsiPhyFifoAltEmpty())) {
\r
433 // Force a lock-up.
\r
436 if (newPhase != oldPhase)
\r
438 if ((newPhase == DATA_IN || newPhase == DATA_OUT) &&
\r
439 scsiDev.target->syncOffset)
\r
441 if (scsiDev.target->syncPeriod == 12)
\r
443 // SCSI2 FAST-20 Timing. 20MB/s.
\r
444 *SCSI_CTRL_TIMING = SCSI_FAST20_DESKEW;
\r
445 *SCSI_CTRL_TIMING2 = SCSI_FAST20_TIMING;
\r
447 else if (scsiDev.target->syncPeriod == 25)
\r
449 // SCSI2 FAST Timing. 10MB/s.
\r
450 *SCSI_CTRL_TIMING = SCSI_FAST10_DESKEW;
\r
451 *SCSI_CTRL_TIMING2 = SCSI_FAST10_TIMING;
\r
454 *SCSI_CTRL_TIMING = SCSI_DEFAULT_DESKEW;
\r
455 *SCSI_CTRL_TIMING2 = SCSI_DEFAULT_TIMING;
\r
457 *SCSI_CTRL_SYNC_OFFSET = scsiDev.target->syncOffset;
\r
459 *SCSI_CTRL_SYNC_OFFSET = 0;
\r
460 *SCSI_CTRL_TIMING = SCSI_DEFAULT_TIMING;
\r
463 *SCSI_CTRL_PHASE = newPhase;
\r
466 if (scsiDev.compatMode < COMPAT_SCSI2)
\r
474 void scsiPhyReset()
\r
476 trace(trace_scsiPhyReset);
\r
479 trace(trace_spinDMAReset);
\r
480 HAL_DMA_Abort(&memToFSMC);
\r
481 HAL_DMA_Abort(&fsmcToMem);
\r
486 *SCSI_CTRL_PHASE = 0x00;
\r
487 *SCSI_CTRL_BSY = 0x00;
\r
488 s2s_fpgaReset(); // Clears fifos etc.
\r
490 scsiPhyFifoSel = 0;
\r
491 *SCSI_FIFO_SEL = 0;
\r
492 *SCSI_CTRL_DBX = 0;
\r
494 *SCSI_CTRL_SYNC_OFFSET = 0;
\r
495 *SCSI_CTRL_TIMING = SCSI_DEFAULT_TIMING;
\r
497 // DMA Benchmark code
\r
498 // Currently 11MB/s.
\r
499 #ifdef DMA_BENCHMARK
\r
504 for (int i = 0; i < (100LL * 1024 * 1024 / SCSI_FIFO_DEPTH); ++i)
\r
508 (uint32_t) &scsiDev.data[0],
\r
509 (uint32_t) SCSI_FIFO_DATA,
\r
510 SCSI_FIFO_DEPTH / 4);
\r
512 HAL_DMA_PollForTransfer(
\r
514 HAL_DMA_FULL_TRANSFER,
\r
521 for(int i = 0; i < 10; ++i) s2s_delay_ms(1000);
\r
525 // FPGA comms test code
\r
529 for (int j = 0; j < SCSI_FIFO_DEPTH; ++j)
\r
531 scsiDev.data[j] = j;
\r
534 if (!scsiPhyFifoEmpty())
\r
539 *SCSI_CTRL_PHASE = DATA_IN;
\r
542 (uint32_t) &scsiDev.data[0],
\r
543 (uint32_t) SCSI_FIFO_DATA,
\r
544 SCSI_FIFO_DEPTH / 4);
\r
546 HAL_DMA_PollForTransfer(
\r
548 HAL_DMA_FULL_TRANSFER,
\r
551 if (!scsiPhyFifoFull())
\r
556 memset(&scsiDev.data[0], 0, SCSI_FIFO_DEPTH);
\r
558 *SCSI_CTRL_PHASE = DATA_OUT;
\r
561 (uint32_t) SCSI_FIFO_DATA,
\r
562 (uint32_t) &scsiDev.data[0],
\r
563 SCSI_FIFO_DEPTH / 2);
\r
565 HAL_DMA_PollForTransfer(
\r
567 HAL_DMA_FULL_TRANSFER,
\r
570 if (!scsiPhyFifoEmpty())
\r
576 for (int j = 0; j < SCSI_FIFO_DEPTH; ++j)
\r
578 if (scsiDev.data[j] != (uint8_t) j)
\r
591 static void scsiPhyInitDMA()
\r
593 // One-time init only.
\r
594 static uint8_t init = 0;
\r
599 // Memory to memory transfers can only be done using DMA2
\r
600 __DMA2_CLK_ENABLE();
\r
602 // Transmit SCSI data. The source data is treated as the
\r
603 // peripheral (even though this is memory-to-memory)
\r
604 memToFSMC.Instance = DMA2_Stream0;
\r
605 memToFSMC.Init.Channel = DMA_CHANNEL_0;
\r
606 memToFSMC.Init.Direction = DMA_MEMORY_TO_MEMORY;
\r
607 memToFSMC.Init.PeriphInc = DMA_PINC_ENABLE;
\r
608 memToFSMC.Init.MemInc = DMA_MINC_DISABLE;
\r
609 memToFSMC.Init.PeriphDataAlignment = DMA_PDATAALIGN_WORD;
\r
610 memToFSMC.Init.MemDataAlignment = DMA_MDATAALIGN_HALFWORD;
\r
611 memToFSMC.Init.Mode = DMA_NORMAL;
\r
612 memToFSMC.Init.Priority = DMA_PRIORITY_LOW;
\r
613 // FIFO mode is needed to allow conversion from 32bit words to the
\r
614 // 16bit FSMC interface.
\r
615 memToFSMC.Init.FIFOMode = DMA_FIFOMODE_ENABLE;
\r
617 // We only use 1 word (4 bytes) in the fifo at a time. Normally it's
\r
618 // better to let the DMA fifo fill up then do burst transfers, but
\r
619 // bursting out the FSMC interface will be very slow and may starve
\r
620 // other (faster) transfers. We don't want to risk the SDIO transfers
\r
621 // from overrun/underrun conditions.
\r
622 memToFSMC.Init.FIFOThreshold = DMA_FIFO_THRESHOLD_1QUARTERFULL;
\r
623 memToFSMC.Init.MemBurst = DMA_MBURST_SINGLE;
\r
624 memToFSMC.Init.PeriphBurst = DMA_PBURST_SINGLE;
\r
625 HAL_DMA_Init(&memToFSMC);
\r
627 // Receive SCSI data. The source data (fsmc) is treated as the
\r
628 // peripheral (even though this is memory-to-memory)
\r
629 fsmcToMem.Instance = DMA2_Stream1;
\r
630 fsmcToMem.Init.Channel = DMA_CHANNEL_0;
\r
631 fsmcToMem.Init.Direction = DMA_MEMORY_TO_MEMORY;
\r
632 fsmcToMem.Init.PeriphInc = DMA_PINC_DISABLE;
\r
633 fsmcToMem.Init.MemInc = DMA_MINC_ENABLE;
\r
634 fsmcToMem.Init.PeriphDataAlignment = DMA_PDATAALIGN_HALFWORD;
\r
635 fsmcToMem.Init.MemDataAlignment = DMA_MDATAALIGN_WORD;
\r
636 fsmcToMem.Init.Mode = DMA_NORMAL;
\r
637 fsmcToMem.Init.Priority = DMA_PRIORITY_LOW;
\r
638 fsmcToMem.Init.FIFOMode = DMA_FIFOMODE_ENABLE;
\r
639 fsmcToMem.Init.FIFOThreshold = DMA_FIFO_THRESHOLD_1QUARTERFULL;
\r
640 fsmcToMem.Init.MemBurst = DMA_MBURST_SINGLE;
\r
641 fsmcToMem.Init.PeriphBurst = DMA_PBURST_SINGLE;
\r
642 HAL_DMA_Init(&fsmcToMem);
\r
644 // TODO configure IRQs
\r
653 *SCSI_CTRL_IDMASK = 0x00; // Reset in scsiPhyConfig
\r
654 *SCSI_CTRL_PHASE = 0x00;
\r
655 *SCSI_CTRL_BSY = 0x00;
\r
656 scsiPhyFifoSel = 0;
\r
657 *SCSI_FIFO_SEL = 0;
\r
658 *SCSI_CTRL_DBX = 0;
\r
660 *SCSI_CTRL_SYNC_OFFSET = 0;
\r
661 *SCSI_CTRL_TIMING = SCSI_DEFAULT_TIMING;
\r
665 void scsiPhyConfig()
\r
667 if (scsiDev.boardCfg.flags6 & S2S_CFG_ENABLE_TERMINATOR)
\r
669 HAL_GPIO_WritePin(nTERM_EN_GPIO_Port, nTERM_EN_Pin, GPIO_PIN_RESET);
\r
673 HAL_GPIO_WritePin(nTERM_EN_GPIO_Port, nTERM_EN_Pin, GPIO_PIN_SET);
\r
677 uint8_t idMask = 0;
\r
678 for (int i = 0; i < 8; ++i)
\r
680 const S2S_TargetCfg* cfg = s2s_getConfigById(i);
\r
681 if (cfg && (cfg->scsiId & S2S_CFG_TARGET_ENABLED))
\r
683 idMask |= (1 << i);
\r
686 *SCSI_CTRL_IDMASK = idMask;
\r
691 // 2 = Parity error
\r
695 // 32 = other error
\r
698 if (scsiDev.phase != BUS_FREE)
\r
703 // Acquire the SCSI bus.
\r
704 for (int i = 0; i < 100; ++i)
\r
706 if (scsiStatusBSY())
\r
711 if (scsiStatusBSY())
\r
713 // Error, couldn't acquire scsi bus
\r
716 *SCSI_CTRL_BSY = 1;
\r
717 if (! scsiStatusBSY())
\r
719 // Error, BSY doesn't work.
\r
723 // Should be safe to use the bus now.
\r
730 for (i = 0; i < 256; ++i)
\r
732 *SCSI_CTRL_DBX = i;
\r
734 if (*SCSI_STS_DBX != (i & 0xff))
\r
738 /*if (Lookup_OddParity[i & 0xff] != SCSI_ReadPin(SCSI_In_DBP))
\r
743 *SCSI_CTRL_DBX = 0;
\r
745 // TEST MSG, CD, IO
\r
747 for (i = 0; i < 8; ++i)
\r
749 SCSI_CTL_PHASE_Write(i);
\r
752 if (SCSI_ReadPin(SCSI_In_MSG) != !!(i & __scsiphase_msg))
\r
756 if (SCSI_ReadPin(SCSI_In_CD) != !!(i & __scsiphase_cd))
\r
760 if (SCSI_ReadPin(SCSI_In_IO) != !!(i & __scsiphase_io))
\r
765 SCSI_CTL_PHASE_Write(0);
\r
767 uint32_t signalsOut[] = { SCSI_Out_ATN, SCSI_Out_BSY, SCSI_Out_RST, SCSI_Out_SEL };
\r
768 uint32_t signalsIn[] = { SCSI_Filt_ATN, SCSI_Filt_BSY, SCSI_Filt_RST, SCSI_Filt_SEL };
\r
770 for (i = 0; i < 4; ++i)
\r
772 SCSI_SetPin(signalsOut[i]);
\r
776 for (j = 0; j < 4; ++j)
\r
780 if (! SCSI_ReadFilt(signalsIn[j]))
\r
787 if (SCSI_ReadFilt(signalsIn[j]))
\r
793 SCSI_ClearPin(signalsOut[i]);
\r
797 *SCSI_CTRL_BSY = 0;
\r