1 // Copyright (C) 2013 Michael McMaster <michael@codesrc.com>
\r
3 // This file is part of SCSI2SD.
\r
5 // SCSI2SD is free software: you can redistribute it and/or modify
\r
6 // it under the terms of the GNU General Public License as published by
\r
7 // the Free Software Foundation, either version 3 of the License, or
\r
8 // (at your option) any later version.
\r
10 // SCSI2SD is distributed in the hope that it will be useful,
\r
11 // but WITHOUT ANY WARRANTY; without even the implied warranty of
\r
12 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
\r
13 // GNU General Public License for more details.
\r
15 // You should have received a copy of the GNU General Public License
\r
16 // along with SCSI2SD. If not, see <http://www.gnu.org/licenses/>.
\r
18 #include "stm32f2xx.h"
\r
19 #include "stm32f2xx_hal.h"
\r
20 #include "stm32f2xx_hal_dma.h"
\r
23 #include "scsiPhy.h"
\r
31 // Private DMA variables.
\r
// File-local flag, initialised to 0 (no transfer).
// NOTE(review): no read or write of this variable is visible in this excerpt;
// presumably it marks an outstanding DMA transfer - confirm against the DMA
// start/poll functions.
32 static int dmaInProgress = 0;
\r
// HAL DMA handle for transmitting SCSI data (memory -> FSMC FIFO).
// Configured on DMA2_Stream0 in scsiPhyInitDMA(); aborted in scsiPhyReset().
34 static DMA_HandleTypeDef memToFSMC;
\r
// HAL DMA handle for receiving SCSI data (FSMC FIFO -> memory).
// Configured on DMA2_Stream1 in scsiPhyInitDMA(); started by scsiReadDMA()
// with SCSI_FIFO_DATA as the source, and aborted in scsiPhyReset().
35 static DMA_HandleTypeDef fsmcToMem;
\r
// Receive-DMA completion flag. Cleared to 0 when scsiReadDMA() starts a
// transfer; set to 1 by scsiRxCompleteISR and by the DMA read/write code in
// this file once a transfer is finished or when only a transmit is active.
38 volatile uint8_t scsiRxDMAComplete;
\r
// Transmit-DMA completion flag. Cleared to 0 when scsiWriteDMA() starts a
// transfer; set to 1 by scsiTxCompleteISR and by the DMA read/write code in
// this file once a transfer is finished or when only a receive is active.
39 volatile uint8_t scsiTxDMAComplete;
\r
42 CY_ISR_PROTO(scsiRxCompleteISR);
\r
43 CY_ISR(scsiRxCompleteISR)
\r
45 traceIrq(trace_scsiRxCompleteISR);
\r
46 scsiRxDMAComplete = 1;
\r
49 CY_ISR_PROTO(scsiTxCompleteISR);
\r
50 CY_ISR(scsiTxCompleteISR)
\r
52 traceIrq(trace_scsiTxCompleteISR);
\r
53 scsiTxDMAComplete = 1;
\r
// Software copy of the FIFO selection; it is reset to 0 in this file at the
// same points where 0 is written to the *SCSI_FIFO_SEL register.
// NOTE(review): non-static, so presumably also used from other translation
// units (e.g. via scsiPhy.h) - confirm.
57 uint8_t scsiPhyFifoSel = 0; // global
\r
59 // scsi IRQ handler is initialised by the STM32 HAL. Connected to
\r
61 // Note: naming is important to ensure this function is listed in the
\r
63 void EXTI4_IRQHandler()
\r
65 traceIrq(trace_scsiResetISR);
\r
67 // Make sure that interrupt flag is set
\r
68 if (__HAL_GPIO_EXTI_GET_IT(GPIO_PIN_4) != RESET) {
\r
70 // Clear interrupt flag
\r
71 __HAL_GPIO_EXTI_CLEAR_IT(GPIO_PIN_4);
\r
73 scsiDev.resetFlag = scsiDev.resetFlag || scsiStatusRST();
\r
74 // TODO grab SEL status as well
\r
79 static void assertFail()
\r
91 startScsiRx(uint32_t count)
\r
93 *SCSI_DATA_CNT_HI = count >> 8;
\r
94 *SCSI_DATA_CNT_LO = count & 0xff;
\r
95 *SCSI_DATA_CNT_SET = 1;
\r
102 if (!scsiPhyFifoAltEmpty()) {
\r
103 // Force a lock-up.
\r
109 trace(trace_spinPhyRxFifo);
\r
110 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag)) {}
\r
112 uint8_t val = scsiPhyRx();
\r
113 // TODO scsiDev.parityError = scsiDev.parityError || SCSI_Parity_Error_Read();
\r
116 if (!scsiPhyFifoEmpty()) {
\r
118 uint8_t k __attribute((unused));
\r
119 while (!scsiPhyFifoEmpty()) { k = scsiPhyRx(); ++j; }
\r
121 // Force a lock-up.
\r
130 scsiReadPIO(uint8_t* data, uint32_t count)
\r
132 for (int i = 0; i < count; ++i)
\r
134 data[i] = scsiPhyRx();
\r
136 // TODO scsiDev.parityError = scsiDev.parityError || SCSI_Parity_Error_Read();
\r
140 scsiReadDMA(uint8_t* data, uint32_t count)
\r
142 // Prepare DMA transfer
\r
144 trace(trace_doRxSingleDMA);
\r
146 scsiTxDMAComplete = 1; // TODO not used much
\r
147 scsiRxDMAComplete = 0; // TODO not used much
\r
149 HAL_DMA_Start(&fsmcToMem, (uint32_t) SCSI_FIFO_DATA, (uint32_t) data, count);
\r
155 int complete = __HAL_DMA_GET_COUNTER(&fsmcToMem) == 0;
\r
156 complete = complete && (HAL_DMA_PollForTransfer(&fsmcToMem, HAL_DMA_FULL_TRANSFER, 0xffffffff) == HAL_OK);
\r
159 scsiTxDMAComplete = 1; // TODO MM FIX IRQ
\r
160 scsiRxDMAComplete = 1;
\r
164 // TODO MM scsiDev.parityError = scsiDev.parityError || SCSI_Parity_Error_Read();
\r
176 scsiRead(uint8_t* data, uint32_t count)
\r
181 uint32_t chunk = ((count - i) > SCSI_FIFO_DEPTH)
\r
182 ? SCSI_FIFO_DEPTH : (count - i);
\r
185 // DMA is doing 32bit transfers.
\r
186 chunk = chunk & 0xFFFFFFF8;
\r
188 startScsiRx(chunk);
\r
190 while (i < count && likely(!scsiDev.resetFlag))
\r
192 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag)) {}
\r
195 uint32_t nextChunk = ((count - i - chunk) > SCSI_FIFO_DEPTH)
\r
196 ? SCSI_FIFO_DEPTH : (count - i - chunk);
\r
197 if (nextChunk >= 16)
\r
199 nextChunk = nextChunk & 0xFFFFFFF8;
\r
203 startScsiRx(nextChunk);
\r
208 scsiReadPIO(data + i, chunk);
\r
212 scsiReadDMA(data + i, chunk);
\r
214 trace(trace_spinReadDMAPoll);
\r
216 while (!scsiReadDMAPoll() && likely(!scsiDev.resetFlag))
\r
222 if (!scsiPhyFifoEmpty()) {
\r
224 while (!scsiPhyFifoEmpty()) { scsiPhyRx(); ++j; }
\r
225 // Force a lock-up.
\r
235 scsiWriteByte(uint8_t value)
\r
238 if (!scsiPhyFifoEmpty()) {
\r
239 // Force a lock-up.
\r
243 trace(trace_spinPhyTxFifo);
\r
247 trace(trace_spinTxComplete);
\r
248 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag)) {}
\r
251 if (!scsiPhyFifoAltEmpty()) {
\r
252 // Force a lock-up.
\r
259 scsiWritePIO(const uint8_t* data, uint32_t count)
\r
261 for (int i = 0; i < count; ++i)
\r
263 scsiPhyTx(data[i]);
\r
268 scsiWriteDMA(const uint8_t* data, uint32_t count)
\r
270 // Prepare DMA transfer
\r
272 trace(trace_doTxSingleDMA);
\r
274 scsiTxDMAComplete = 0;
\r
275 scsiRxDMAComplete = 1;
\r
280 (uint32_t) SCSI_FIFO_DATA,
\r
287 int complete = __HAL_DMA_GET_COUNTER(&memToFSMC) == 0;
\r
288 complete = complete && (HAL_DMA_PollForTransfer(&memToFSMC, HAL_DMA_FULL_TRANSFER, 0xffffffff) == HAL_OK);
\r
291 scsiTxDMAComplete = 1; // TODO MM FIX IRQ
\r
292 scsiRxDMAComplete = 1;
\r
304 scsiWrite(const uint8_t* data, uint32_t count)
\r
307 while (i < count && likely(!scsiDev.resetFlag))
\r
309 uint32_t chunk = ((count - i) > SCSI_FIFO_DEPTH)
\r
310 ? SCSI_FIFO_DEPTH : (count - i);
\r
313 if (!scsiPhyFifoEmpty()) {
\r
314 // Force a lock-up.
\r
321 scsiWritePIO(data + i, chunk);
\r
325 // DMA is doing 32bit transfers.
\r
326 chunk = chunk & 0xFFFFFFF8;
\r
327 scsiWriteDMA(data + i, chunk);
\r
329 trace(trace_spinReadDMAPoll);
\r
331 while (!scsiWriteDMAPoll() && likely(!scsiDev.resetFlag))
\r
336 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag))
\r
341 if (!scsiPhyFifoAltEmpty()) {
\r
342 // Force a lock-up.
\r
350 while (!scsiPhyComplete() && likely(!scsiDev.resetFlag))
\r
355 if (!scsiPhyFifoAltEmpty()) {
\r
356 // Force a lock-up.
\r
362 static inline void busSettleDelay(void)
\r
364 // Data Release time (switching IO) = 400ns
\r
365 // + Bus Settle time (switching phase) = 400ns.
\r
366 s2s_delay_us(1); // Close enough.
\r
369 void scsiEnterBusFree()
\r
371 *SCSI_CTRL_BSY = 0x00;
\r
372 // We now have a Bus Clear Delay of 800ns to release remaining signals.
\r
373 *SCSI_CTRL_PHASE = 0;
\r
376 void scsiEnterPhase(int phase)
\r
378 // ANSI INCITS 362-2002 SPI-3 10.7.1:
\r
379 // Phase changes are not allowed while REQ or ACK is asserted.
\r
380 while (likely(!scsiDev.resetFlag) && scsiStatusACK()) {}
\r
382 int newPhase = phase > 0 ? phase : 0;
\r
383 int oldPhase = *SCSI_CTRL_PHASE;
\r
385 if (!scsiPhyFifoEmpty() || !scsiPhyFifoAltEmpty()) {
\r
386 // Force a lock-up.
\r
389 if (newPhase != oldPhase)
\r
391 *SCSI_CTRL_PHASE = newPhase;
\r
394 if (scsiDev.compatMode < COMPAT_SCSI2)
\r
402 void scsiPhyReset()
\r
404 trace(trace_scsiPhyReset);
\r
407 trace(trace_spinDMAReset);
\r
408 HAL_DMA_Abort(&memToFSMC);
\r
409 HAL_DMA_Abort(&fsmcToMem);
\r
415 // Set the Clear bits for both SCSI device FIFOs
\r
416 scsiTarget_AUX_CTL = scsiTarget_AUX_CTL | 0x03;
\r
418 // Trigger RST ourselves. It is connected to the datapath and will
\r
419 // ensure it returns to the idle state. The datapath runs at the BUS clk
\r
420 // speed (ie. same as the CPU), so we can be sure it is active for a sufficient
\r
422 SCSI_RST_ISR_Disable();
\r
423 SCSI_SetPin(SCSI_Out_RST);
\r
425 SCSI_CTL_PHASE_Write(0);
\r
426 SCSI_ClearPin(SCSI_Out_ATN);
\r
427 SCSI_ClearPin(SCSI_Out_BSY);
\r
428 SCSI_ClearPin(SCSI_Out_ACK);
\r
429 SCSI_ClearPin(SCSI_Out_RST);
\r
430 SCSI_ClearPin(SCSI_Out_SEL);
\r
431 SCSI_ClearPin(SCSI_Out_REQ);
\r
433 // Allow the FIFOs to fill up again.
\r
434 SCSI_ClearPin(SCSI_Out_RST);
\r
435 SCSI_RST_ISR_Enable();
\r
436 scsiTarget_AUX_CTL = scsiTarget_AUX_CTL & ~(0x03);
\r
438 SCSI_Parity_Error_Read(); // clear sticky bits
\r
441 *SCSI_CTRL_PHASE = 0x00;
\r
442 *SCSI_CTRL_BSY = 0x00;
\r
443 s2s_fpgaReset(); // Clears fifos etc.
\r
445 scsiPhyFifoSel = 0;
\r
446 *SCSI_FIFO_SEL = 0;
\r
447 *SCSI_CTRL_DBX = 0;
\r
449 // DMA Benchmark code
\r
450 // Currently 10MB/s. Assume 20MB/s is achievable with 16 bits.
\r
451 #ifdef DMA_BENCHMARK
\r
456 for (int i = 0; i < (100LL * 1024 * 1024 / SCSI_FIFO_DEPTH); ++i)
\r
460 (uint32_t) &scsiDev.data[0],
\r
461 (uint32_t) SCSI_FIFO_DATA,
\r
462 SCSI_FIFO_DEPTH / 4);
\r
464 HAL_DMA_PollForTransfer(
\r
466 HAL_DMA_FULL_TRANSFER,
\r
473 for(int i = 0; i < 10; ++i) s2s_delay_ms(1000);
\r
477 // FPGA comms test code
\r
481 for (int j = 0; j < SCSI_FIFO_DEPTH; ++j)
\r
483 scsiDev.data[j] = j;
\r
486 if (!scsiPhyFifoEmpty())
\r
491 *SCSI_CTRL_PHASE = DATA_IN;
\r
494 (uint32_t) &scsiDev.data[0],
\r
495 (uint32_t) SCSI_FIFO_DATA,
\r
496 SCSI_FIFO_DEPTH / 4);
\r
498 HAL_DMA_PollForTransfer(
\r
500 HAL_DMA_FULL_TRANSFER,
\r
503 if (!scsiPhyFifoFull())
\r
508 memset(&scsiDev.data[0], 0, SCSI_FIFO_DEPTH);
\r
510 *SCSI_CTRL_PHASE = DATA_OUT;
\r
513 (uint32_t) SCSI_FIFO_DATA,
\r
514 (uint32_t) &scsiDev.data[0],
\r
517 HAL_DMA_PollForTransfer(
\r
519 HAL_DMA_FULL_TRANSFER,
\r
522 if (!scsiPhyFifoEmpty())
\r
528 for (int j = 0; j < SCSI_FIFO_DEPTH; ++j)
\r
530 if (scsiDev.data[j] != (uint8_t) j)
\r
543 static void scsiPhyInitDMA()
\r
545 // One-time init only.
\r
546 static uint8_t init = 0;
\r
551 // Memory to memory transfers can only be done using DMA2
\r
552 __DMA2_CLK_ENABLE();
\r
554 // Transmit SCSI data. The source data is treated as the
\r
555 // peripheral (even though this is memory-to-memory)
\r
556 memToFSMC.Instance = DMA2_Stream0;
\r
557 memToFSMC.Init.Channel = DMA_CHANNEL_0;
\r
558 memToFSMC.Init.Direction = DMA_MEMORY_TO_MEMORY;
\r
559 memToFSMC.Init.PeriphInc = DMA_PINC_ENABLE;
\r
560 memToFSMC.Init.MemInc = DMA_MINC_DISABLE;
\r
561 memToFSMC.Init.PeriphDataAlignment = DMA_PDATAALIGN_WORD;
\r
562 memToFSMC.Init.MemDataAlignment = DMA_MDATAALIGN_BYTE;
\r
563 memToFSMC.Init.Mode = DMA_NORMAL;
\r
564 memToFSMC.Init.Priority = DMA_PRIORITY_LOW;
\r
565 // FIFO mode is needed to allow conversion from 32bit words to the
\r
566 // 8bit FSMC interface.
\r
567 memToFSMC.Init.FIFOMode = DMA_FIFOMODE_ENABLE;
\r
569 // We only use 1 word (4 bytes) in the fifo at a time. Normally it's
\r
570 // better to let the DMA fifo fill up then do burst transfers, but
\r
571 // bursting out the FSMC interface will be very slow and may starve
\r
572 // other (faster) transfers. We don't want to risk the SDIO transfers
\r
573 // from overrun/underrun conditions.
\r
574 memToFSMC.Init.FIFOThreshold = DMA_FIFO_THRESHOLD_1QUARTERFULL;
\r
575 memToFSMC.Init.MemBurst = DMA_MBURST_SINGLE;
\r
576 memToFSMC.Init.PeriphBurst = DMA_PBURST_SINGLE;
\r
577 HAL_DMA_Init(&memToFSMC);
\r
579 // Receive SCSI data. The source data (fsmc) is treated as the
\r
580 // peripheral (even though this is memory-to-memory)
\r
581 fsmcToMem.Instance = DMA2_Stream1;
\r
582 fsmcToMem.Init.Channel = DMA_CHANNEL_0;
\r
583 fsmcToMem.Init.Direction = DMA_MEMORY_TO_MEMORY;
\r
584 fsmcToMem.Init.PeriphInc = DMA_PINC_DISABLE;
\r
585 fsmcToMem.Init.MemInc = DMA_MINC_ENABLE;
\r
586 fsmcToMem.Init.PeriphDataAlignment = DMA_PDATAALIGN_BYTE;
\r
587 fsmcToMem.Init.MemDataAlignment = DMA_MDATAALIGN_WORD;
\r
588 fsmcToMem.Init.Mode = DMA_NORMAL;
\r
589 fsmcToMem.Init.Priority = DMA_PRIORITY_LOW;
\r
590 fsmcToMem.Init.FIFOMode = DMA_FIFOMODE_ENABLE;
\r
591 fsmcToMem.Init.FIFOThreshold = DMA_FIFO_THRESHOLD_1QUARTERFULL;
\r
592 fsmcToMem.Init.MemBurst = DMA_MBURST_SINGLE;
\r
593 fsmcToMem.Init.PeriphBurst = DMA_PBURST_SINGLE;
\r
594 HAL_DMA_Init(&fsmcToMem);
\r
596 // TODO configure IRQs
\r
605 *SCSI_CTRL_IDMASK = 0x00; // Reset in scsiPhyConfig
\r
606 *SCSI_CTRL_PHASE = 0x00;
\r
607 *SCSI_CTRL_BSY = 0x00;
\r
608 scsiPhyFifoSel = 0;
\r
609 *SCSI_FIFO_SEL = 0;
\r
610 *SCSI_CTRL_DBX = 0;
\r
614 void scsiPhyConfig()
\r
616 if (scsiDev.boardCfg.flags6 & S2S_CFG_ENABLE_TERMINATOR)
\r
618 HAL_GPIO_WritePin(nTERM_EN_GPIO_Port, nTERM_EN_Pin, GPIO_PIN_RESET);
\r
622 HAL_GPIO_WritePin(nTERM_EN_GPIO_Port, nTERM_EN_Pin, GPIO_PIN_SET);
\r
626 uint8_t idMask = 0;
\r
627 for (int i = 0; i < 8; ++i)
\r
629 const S2S_TargetCfg* cfg = s2s_getConfigById(i);
\r
630 if (cfg && (cfg->scsiId & S2S_CFG_TARGET_ENABLED))
\r
632 idMask |= (1 << i);
\r
635 *SCSI_CTRL_IDMASK = idMask;
\r
640 // 2 = Parity error
\r
644 // 32 = other error
\r
647 if (scsiDev.phase != BUS_FREE)
\r
652 // Acquire the SCSI bus.
\r
653 for (int i = 0; i < 100; ++i)
\r
655 if (scsiStatusBSY())
\r
660 if (scsiStatusBSY())
\r
662 // Error, couldn't acquire scsi bus
\r
665 *SCSI_CTRL_BSY = 1;
\r
666 if (! scsiStatusBSY())
\r
668 // Error, BSY doesn't work.
\r
672 // Should be safe to use the bus now.
\r
679 for (i = 0; i < 256; ++i)
\r
681 *SCSI_CTRL_DBX = i;
\r
683 if (*SCSI_STS_DBX != (i & 0xff))
\r
687 /*if (Lookup_OddParity[i & 0xff] != SCSI_ReadPin(SCSI_In_DBP))
\r
692 *SCSI_CTRL_DBX = 0;
\r
694 // TEST MSG, CD, IO
\r
696 for (i = 0; i < 8; ++i)
\r
698 SCSI_CTL_PHASE_Write(i);
\r
701 if (SCSI_ReadPin(SCSI_In_MSG) != !!(i & __scsiphase_msg))
\r
705 if (SCSI_ReadPin(SCSI_In_CD) != !!(i & __scsiphase_cd))
\r
709 if (SCSI_ReadPin(SCSI_In_IO) != !!(i & __scsiphase_io))
\r
714 SCSI_CTL_PHASE_Write(0);
\r
716 uint32_t signalsOut[] = { SCSI_Out_ATN, SCSI_Out_BSY, SCSI_Out_RST, SCSI_Out_SEL };
\r
717 uint32_t signalsIn[] = { SCSI_Filt_ATN, SCSI_Filt_BSY, SCSI_Filt_RST, SCSI_Filt_SEL };
\r
719 for (i = 0; i < 4; ++i)
\r
721 SCSI_SetPin(signalsOut[i]);
\r
725 for (j = 0; j < 4; ++j)
\r
729 if (! SCSI_ReadFilt(signalsIn[j]))
\r
736 if (SCSI_ReadFilt(signalsIn[j]))
\r
742 SCSI_ClearPin(signalsOut[i]);
\r
746 *SCSI_CTRL_BSY = 0;
\r