source: trunk/src/os2ahci/ata.c@ 125

Last change on this file since 125 was 125, checked in by cjm, 14 years ago

Version 1.21


  • Triggered by reports of performance loss with NCQ
  • New command line flag "/F" to force using write buffers even when upstream I/O requested non-buffered I/O; the primary purpose of this flag is to debug the NCQ performance drop but the flag may or may not remain.
File size: 40.1 KB
Line 
1/******************************************************************************
2 * ata.c - ATA command processing
3 *
4 * Copyright (c) 2011 thi.guten Software Development
5 * Copyright (c) 2011 Mensys B.V.
6 *
7 * Authors: Christian Mueller, Markus Thielen
8 *
9 * Parts copied from/inspired by the Linux AHCI driver;
10 * those parts are (c) Linux AHCI/ATA maintainers
11 *
12 * This program is free software; you can redistribute it and/or modify
13 * it under the terms of the GNU General Public License as published by
14 * the Free Software Foundation; either version 2 of the License, or
15 * (at your option) any later version.
16 *
17 * This program is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 * GNU General Public License for more details.
21 *
22 * You should have received a copy of the GNU General Public License
23 * along with this program; if not, write to the Free Software
24 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
25 */
26
27#include "os2ahci.h"
28#include "ata.h"
29
30/* -------------------------- macros and constants ------------------------- */
31
32/* ------------------------ typedefs and structures ------------------------ */
33
34/* -------------------------- function prototypes -------------------------- */
35
36static int ata_cmd_read (IORBH _far *iorb, AD_INFO *ai, int p, int d, int slot,
37 ULONG sector, ULONG count, SCATGATENTRY _far *sg_list,
38 ULONG sg_cnt);
39
40static int ata_cmd_write(IORBH _far *iorb, AD_INFO *ai, int p, int d, int slot,
41 ULONG sector, ULONG count, SCATGATENTRY _far *sg_list,
42 ULONG sg_cnt, int write_through);
43
44/* ------------------------ global/static variables ------------------------ */
45
46/* ----------------------------- start of code ----------------------------- */
47
48/******************************************************************************
49 * Initialize AHCI command slot, FIS and S/G list for the specified ATA
50 * command. The command parameters are passed as a variable argument list
51 * of type and value(s). The list is terminated by AP_END.
52 *
53 * Notes:
54 *
55 * - The specified command slot is expected to be idle; no checks are
56 * performed to prevent messing with a busy port.
57 *
58 * - Port multipliers are not supported, yet, thus 'd' should always
59 * be 0 for the time being.
60 *
61 * - 'cmd' is passed as 16-bit integer because the compiler would push
62 * a 'u8' as 16-bit value (it's a fixed argument) and the stdarg
63 * macros would screw up the address of the first variable argument
64 * if the size of the last fixed argument wouldn't match what the
65 * compiler pushed on the stack.
66 *
67 * Return values:
68 * 0 : success
69 * > 0 : could not map all S/G entries; the return value is the number of
70 * S/G entries that could be mapped.
71 * < 0 : other error
72 */
73int ata_cmd(AD_INFO *ai, int p, int d, int slot, int cmd, ...)
74{
75 va_list va;
76 va_start(va, cmd);
77 return(v_ata_cmd(ai, p, d, slot, cmd, va));
78}
79
80int v_ata_cmd(AD_INFO *ai, int p, int d, int slot, int cmd, va_list va)
81{
82 AHCI_PORT_DMA _far *dma_base_virt;
83 AHCI_CMD_HDR _far *cmd_hdr;
84 AHCI_CMD_TBL _far *cmd_tbl;
85 SCATGATENTRY _far *sg_list = NULL;
86 SCATGATENTRY sg_single;
87 ATA_PARM ap;
88 ATA_CMD ata_cmd;
89 void _far *atapi_cmd = NULL;
90 u32 dma_base_phys;
91 u16 atapi_cmd_len = 0;
92 u16 ahci_flags = 0;
93 u16 sg_cnt = 0;
94 int i;
95 int n;
96
97 /* --------------------------------------------------------------------------
98 * Initialize ATA command. The ATA command is set up with the main command
99 * value and a variable list of additional parameters such as the sector
100 * address, transfer count, ...
101 */
102 memset(&ata_cmd, 0x00, sizeof(ata_cmd));
103 ata_cmd.cmd = (u8) cmd;
104
105 /* parse variable arguments */
106 do {
107 switch ((ap = va_arg(va, ATA_PARM))) {
108
109 case AP_AHCI_FLAGS:
110 ahci_flags |= va_arg(va, u16);
111 break;
112
113 case AP_WRITE:
114 if (va_arg(va, u16) != 0) {
115 ahci_flags |= AHCI_CMD_WRITE;
116 }
117 break;
118
119 case AP_FEATURES:
120 /* ATA features word */
121 ata_cmd.features |= va_arg(va, u16);
122 break;
123
124 case AP_COUNT:
125 /* transfer count */
126 ata_cmd.count = va_arg(va, u16);
127 break;
128
129 case AP_SECTOR_28:
130 /* 28-bit sector address */
131 ata_cmd.lba_l = va_arg(va, u32);
132 if (ata_cmd.lba_l & 0xf0000000UL) {
133 dprintf("error: LBA-28 address %ld has more than 28 bits\n", ata_cmd.lba_l);
134 return(ATA_CMD_INVALID_PARM);
135 }
136 /* add upper 4 bits to device field */
137 ata_cmd.device |= (ata_cmd.lba_l >> 24) & 0x0fU;
138 /* only lower 24 bits come into lba_l */
139 ata_cmd.lba_l &= 0x00ffffffUL;
140 break;
141
142 case AP_SECTOR_48:
143 /* 48-bit sector address */
144 ata_cmd.lba_l = va_arg(va, u32);
145 ata_cmd.lba_h = va_arg(va, u16);
146 break;
147
148 case AP_DEVICE:
149 /* ATA device byte; note that this byte contains the highest
150 * 4 bits of LBA-28 address; we have to leave them alone here. */
151 ata_cmd.device |= va_arg(va, u16) & 0xf0U;
152 break;
153
154 case AP_SGLIST:
155 /* scatter/gather list in SCATGATENTRY/count format */
156 sg_list = va_arg(va, void _far *);
157 sg_cnt = va_arg(va, u16);
158 break;
159
160 case AP_VADDR:
161 /* virtual buffer address in addr/len format (up to 4K) */
162 sg_single.ppXferBuf = virt_to_phys(va_arg(va, void _far *));
163 sg_single.XferBufLen = va_arg(va, u16);
164 sg_list = &sg_single;
165 sg_cnt = 1;
166 break;
167
168 case AP_ATAPI_CMD:
169 /* ATAPI command */
170 atapi_cmd = va_arg(va, void _far *);
171 atapi_cmd_len = va_arg(va, u16);
172 ahci_flags |= AHCI_CMD_ATAPI;
173 break;
174
175 case AP_ATA_CMD:
176 /* ATA command "pass-through" */
177 memcpy(&ata_cmd, va_arg(va, void _far *), sizeof(ATA_CMD));
178 break;
179
180 case AP_END:
181 break;
182
183 default:
184 dprintf("error: v_ata_cmd() called with invalid parameter type (%d)\n", (int) ap);
185 return(ATA_CMD_INVALID_PARM);
186 }
187
188 } while (ap != AP_END);
189
190 /* --------------------------------------------------------------------------
191 * Fill in AHCI ATA command information. This includes the port command slot,
192 * the corresponding command FIS and the S/G list. The layout of the AHCI
193 * port DMA region is based on the Linux AHCI driver and looks like this:
194 *
195 * - 32 AHCI command headers (AHCI_CMD_HDR) with 32 bytes, each
196 * - 1 FIS receive area with 256 bytes (AHCI_RX_FIS_SZ)
197 * - 32 AHCI command tables, each consisting of
198 * - 64 bytes for command FIS
199 * - 16 bytes for ATAPI comands
200 * - 48 bytes reserved
201 * - 48 S/G entries (AHCI_SG) with 32 bytes, each
202 *
203 * Since the whole DMA buffer for all ports is larger than 64KB and we need
204 * multiple segments to address all of them, there are no virtual pointers
205 * to the individual elements in AD_INFO. Instead, we're relying on macros
206 * for getting the base address of a particular port's DMA region, then
207 * map a structure on top of that for convenience (AHCI_PORT_DMA).
208 */
209 dma_base_virt = port_dma_base(ai, p);
210 dma_base_phys = port_dma_base_phys(ai, p);
211
212 /* AHCI command header */
213 cmd_hdr = dma_base_virt->cmd_hdr + slot;
214 memset(cmd_hdr, 0x00, sizeof(*cmd_hdr));
215 cmd_hdr->options = ((d & 0x0f) << 12);
216 cmd_hdr->options |= ahci_flags; /* AHCI command flags */
217 cmd_hdr->options |= 5; /* length of command FIS in 32-bit words */
218 cmd_hdr->tbl_addr = dma_base_phys + offsetof(AHCI_PORT_DMA, cmd_tbl[slot]);
219
220 /* AHCI command table */
221 cmd_tbl = dma_base_virt->cmd_tbl + slot;
222 memset(cmd_tbl, 0x00, sizeof(*cmd_tbl));
223 ata_cmd_to_fis(cmd_tbl->cmd_fis, &ata_cmd, d);
224
225 if (atapi_cmd != NULL) {
226 /* copy ATAPI command */
227 memcpy(cmd_tbl->atapi_cmd, atapi_cmd, atapi_cmd_len);
228 }
229
230 /* PRDT (S/G list)
231 *
232 * - The S/G list for AHCI adapters is limited to 22 bits for the transfer
233 * size of each element, thus we need to split S/G elements larger than
234 * 22 bits into 2 AHCI_SG elements.
235 *
236 * - The S/G element size for AHCI is what the spec calls '0'-based
237 * (i.e. 0 means 1 bytes). On top of that, the spec requires S/G transfer
238 * sizes to be even in the context of 16-bit transfers, thus bit '1'
239 * always needs to be set.
240 *
241 * - AHCI_MAX_SG_ELEMENT_LEN defines the maximum size of an AHCI S/G
242 * element in bytes, ignoring the '0'-based methodology (i.e. 1 << 22).
243 *
244 * - There's a limit on the maximum number of S/G elements in the port DMA
245 * buffer (AHCI_MAX_SG) which is lower than the HW maximum. It's beyond
246 * the control of this function to split commands which require more
247 * than AHCI_MAX_SG entries. In order to help the caller, the return value
248 * of this function will indicate how many OS/2 S/G entries were
249 * successfully mapped.
250 */
251 for (i = n = 0; i < sg_cnt; i++) {
252 u32 sg_addr = sg_list[i].ppXferBuf;
253 u32 sg_size = sg_list[i].XferBufLen;
254
255 do {
256 u32 chunk = (sg_size > AHCI_MAX_SG_ELEMENT_LEN) ? AHCI_MAX_SG_ELEMENT_LEN
257 : sg_size;
258 if (n >= AHCI_MAX_SG) {
259 /* couldn't store all S/G elements in our DMA buffer */
260 ddprintf("ata_cmd(): too many S/G elements\n");
261 return(i - 1);
262 }
263 if ((sg_addr & 1) || (chunk & 1)) {
264 ddprintf("error: ata_cmd() called with unaligned S/G element(s)\n");
265 return(ATA_CMD_UNALIGNED_ADDR);
266 }
267 cmd_tbl->sg_list[n].addr = sg_addr;
268 cmd_tbl->sg_list[n].size = chunk - 1;
269 sg_addr += chunk;
270 sg_size -= chunk;
271 n++;
272 } while (sg_size > 0);
273 }
274
275 /* set final S/G count in AHCI command header */
276 cmd_hdr->options |= (u32) n << 16;
277
278 if (debug >= 2) {
279 printf("ATA command for %d.%d.%d, slot %d:\n", ad_no(ai), p, d, slot);
280 phex(cmd_hdr, offsetof(AHCI_CMD_HDR, reserved), "cmd_hdr: ");
281 phex(&ata_cmd, sizeof(ata_cmd), "ata_cmd: ");
282 if (atapi_cmd != NULL) {
283 phex(atapi_cmd, atapi_cmd_len, "atapi_cmd: ");
284 }
285 if (n > 0) {
286 phex(cmd_tbl->sg_list, sizeof(*cmd_tbl->sg_list) * n, "sg_list: ");
287 }
288 }
289
290 return(ATA_CMD_SUCCESS);
291}
292
293/******************************************************************************
294 * Fill SATA command FIS with values extracted from an ATA command structure.
295 * The command FIS buffer (fis) is expected to be initialized to 0s. The
296 * structure of the FIS maps to the ATA shadow register block, including
297 * registers which can be written twice to store 16 bits (called 'exp').
298 *
299 * The FIS structure looks like this (using LSB notation):
300 *
301 * +----------------+----------------+----------------+----------------+
302 * 00 | FIS type (27h) | C|R|R|R|PMP | Command | Features |
303 * +----------------+----------------+----------------+----------------+
304 * 04 | LBA 7:0 | LBA 15:8 | LBA 23:16 | R|R|R|D|Head |
305 * +----------------+----------------+----------------+----------------+
306 * 08 | LBA 31:24 | LBA 40:32 | LBA 47:40 | Features exp |
307 * +----------------+----------------+----------------+----------------+
308 * 12 | Count 7:0 | Count 15:8 | Reserved | Control |
309 * +----------------+----------------+----------------+----------------+
310 * 16 | Reserved | Reserved | Reserved | Reserved |
311 * +----------------+----------------+----------------+----------------+
312 */
313void ata_cmd_to_fis(u8 _far *fis, ATA_CMD _far *ata_cmd, int d)
314{
315 fis[0] = 0x27; /* register - host to device FIS */
316 fis[1] = (u8) (d & 0xf); /* port multiplier number */
317 fis[1] |= 0x80; /* bit 7 indicates Command FIS */
318 fis[2] = (u8) ata_cmd->cmd;
319 fis[3] = (u8) ata_cmd->features;
320
321 fis[4] = (u8) ata_cmd->lba_l;
322 fis[5] = (u8) (ata_cmd->lba_l >> 8);
323 fis[6] = (u8) (ata_cmd->lba_l >> 16);
324 fis[7] = (u8) ata_cmd->device;
325
326 fis[8] = (u8) (ata_cmd->lba_l >> 24);
327 fis[9] = (u8) ata_cmd->lba_h;
328 fis[10] = (u8) (ata_cmd->lba_h >> 8);
329 fis[11] = (u8) (ata_cmd->features >> 8);
330
331 fis[12] = (u8) ata_cmd->count;
332 fis[13] = (u8) (ata_cmd->count >> 8);
333}
334
335/******************************************************************************
336 * Get index in S/G list for the number of transferred sectors in the IORB.
337 *
338 * Returning io->cSGList indicates an error.
339 *
340 * NOTE: OS/2 makes sure S/G lists are set up such that entries at the HW
341 * limit will never cross sector boundaries. This means that splitting
342 * S/G lists into multiple commands can be done without editing the S/G
343 * lists.
344 */
345u16 ata_get_sg_indx(IORB_EXECUTEIO _far *io)
346{
347 ULONG offset = io->BlocksXferred * io->BlockSize;
348 USHORT i;
349
350 for (i = 0; i < io->cSGList && offset > 0; i++) {
351 offset -= io->pSGList[i].XferBufLen;
352 }
353
354 return(i);
355}
356
357/******************************************************************************
358 * Get max S/G count which will fit into our HW S/G buffers. This function is
359 * called when the S/G list is too long and we need to split the IORB into
360 * multiple commands. It returns both the number of sectors and S/G list
361 * elements that we can handle in a single command.
362 *
363 * The parameter 'sg_indx' indicates the current start index in the S/G list
364 * (0 if this is the first command iteration).
365 *
366 * The parameter 'sg_max' is the return value of v_ata_cmd() and indicates
367 * how many S/G elements were successfully mapped. Whatever we return needs to
368 * be less or equal to this value.
369 *
370 * Returning 0 in *sg_cnt indicates an error.
371 *
372 * NOTE: OS/2 makes sure S/G lists are set up such that entries at HW limits
373 * will never cross sector boundaries. This means that splitting S/G
374 * lists into multiple commands can be done without editing S/G list
375 * elements. Since AHCI only allows 22 bits for each S/G element, the
376 * hardware limits are reported as AHCI_MAX_SG / 2 but will vary based
377 * on the actual length of S/G elements. This function looks for the
378 * maximum number of S/G elements that can be mapped on sector
379 * boundaries which will still fit into our HW S/G list.
380 */
381void ata_max_sg_cnt(IORB_EXECUTEIO _far *io, USHORT sg_indx, USHORT sg_max,
382 USHORT _far *sg_cnt, USHORT _far *sector_cnt)
383{
384 ULONG max_sector_cnt = 0;
385 USHORT max_sg_cnt = 0;
386 ULONG offset = 0;
387 USHORT i;
388
389 for (i = sg_indx; i < io->cSGList; i++) {
390 if (i - sg_indx >= sg_max) {
391 /* we're beyond the number of S/G elements we can map */
392 break;
393 }
394
395 offset += io->pSGList[i].XferBufLen;
396 if (offset % io->BlockSize == 0) {
397 /* this S/G element ends on a sector boundary */
398 max_sector_cnt = offset / io->BlockSize;
399 max_sg_cnt = i + 1;
400 }
401 }
402
403 /* return the best match we found (0 indicating failure) */
404 *sector_cnt = max_sector_cnt;
405 *sg_cnt = max_sg_cnt;
406}
407
408
409/******************************************************************************
410 * Get device or media geometry. Device and media geometry are expected to be
411 * the same for non-removable devices, which will always be the case for the
412 * ATA devices we're dealing with (hard disks). ATAPI is a different story
413 * and handled by atapi_get_geometry().
414 */
415int ata_get_geometry(IORBH _far *iorb, int slot)
416{
417 ADD_WORKSPACE _far *aws = add_workspace(iorb);
418 int rc;
419
420 /* allocate buffer for ATA identify information */
421 if ((aws->buf = malloc(ATA_ID_WORDS * sizeof(u16))) == NULL) {
422 iorb_seterr(iorb, IOERR_CMD_SW_RESOURCE);
423 return(-1);
424 }
425
426 /* request ATA identify information */
427 aws->ppfunc = ata_get_geometry_pp;
428 rc = ata_cmd(ad_infos + iorb_unit_adapter(iorb),
429 iorb_unit_port(iorb),
430 iorb_unit_device(iorb),
431 slot,
432 ATA_CMD_ID_ATA,
433 AP_VADDR, (void _far *) aws->buf, ATA_ID_WORDS * sizeof(u16),
434 AP_END);
435
436 if (rc != 0) {
437 iorb_seterr(iorb, IOERR_CMD_ADD_SOFTWARE_FAILURE);
438 }
439
440 return(rc);
441}
442
443/******************************************************************************
444 * Post processing function for ata_get_geometry(): convert the ATA identify
445 * information to OS/2 IOCC_GEOMETRY information.
446 */
447void ata_get_geometry_pp(IORBH _far *iorb)
448{
449 GEOMETRY _far *geometry = ((IORB_GEOMETRY _far *) iorb)->pGeometry;
450 USHORT geometry_len = ((IORB_GEOMETRY _far *) iorb)->GeometryLen;
451 u16 *id_buf = add_workspace(iorb)->buf;
452 int a = iorb_unit_adapter(iorb);
453 int p = iorb_unit_port(iorb);
454
455 /* Fill-in geometry information; the ATA-8 spec declares the geometry
456 * fields in the ATA ID buffer as obsolete but it's still the best
457 * guess in most cases. If the information stored in the geometry
458 * fields is apparently incorrect, we'll use the algorithm typically
459 * used by SCSI adapters and modern PC BIOS versions:
460 *
461 * - 512 bytes per sector
462 * - 255 heads
463 * - 63 sectors per track (or 56 with the parameter "/4")
464 * - x cylinders (calculated)
465 *
466 * Please note that os2ahci currently does not natively support ATA sectors
467 * larger than 512 bytes, therefore relies on the translation logic built
468 * into the corresponding ATA disks. In order to prevent file systems that
469 * use block sizes larger than 512 bytes (FAT, JFS, ...) from ending up on
470 * incorrectly aligned physical sector accesses, hence using more physical
471 * I/Os than necessary, the command line parameter "/4" can be used to force
472 * a track size of 56 sectors. This way, partitions will start on 4K
473 * boundaries.
474 *
475 * Another limitation is that OS/2 has a 32-bit variable for the total number
476 * of sectors, limiting the maximum capacity to roughly 2TB. This is another
477 * issue that needs to be addressed sooner or later; large sectors could
478 * raise this limit to something like 8TB but this is not really much of a
479 * difference. Maybe there's something in later DDKs that allows more than
480 * 32 bits?
481 */
482 memset(geometry, 0x00, geometry_len);
483 geometry->BytesPerSector = ATA_SECTOR_SIZE;
484
485 /* extract total number of sectors */
486 if (id_buf[ATA_ID_CFS_ENABLE_2] & 0x400) {
487 /* 48-bit LBA supported */
488 if (ATA_CAPACITY48_H(id_buf) != 0) {
489 /* more than 32 bits for number of sectors */
490 dprintf("warning: limiting disk %d.%d.%d to 2TB\n",
491 iorb_unit_adapter(iorb), iorb_unit_port(iorb),
492 iorb_unit_device(iorb));
493 geometry->TotalSectors = 0xffffffffUL;
494 } else {
495 geometry->TotalSectors = ATA_CAPACITY48_L(id_buf);
496 }
497 } else {
498 /* 28-bit LBA */
499 geometry->TotalSectors = ATA_CAPACITY(id_buf) & 0x0fffffffUL;
500 }
501
502 /* fabricate the remaining geometry fields */
503 if (track_size[a][p] != 0) {
504 /* A specific track size has been requested for this port; this is
505 * typically done for disks with 4K sectors to make sure partitions
506 * start on 8-sector boundaries (parameter "/4").
507 */
508 geometry->NumHeads = 255;
509 geometry->SectorsPerTrack = track_size[a][p];
510 geometry->TotalCylinders = geometry->TotalSectors /
511 ((u32) geometry->NumHeads *
512 (u32) geometry->SectorsPerTrack);
513
514 } else if (CUR_HEADS(id_buf) > 0 && CUR_CYLS(id_buf) > 0 &&
515 CUR_SECTORS(id_buf) > 0 &&
516 CUR_CAPACITY(id_buf) == (u32) CUR_HEADS(id_buf) *
517 (u32) CUR_CYLS(id_buf) *
518 (u32) CUR_SECTORS(id_buf)) {
519 /* BIOS-supplied (aka "current") geometry values look valid */
520 geometry->NumHeads = CUR_HEADS(id_buf);
521 geometry->SectorsPerTrack = CUR_SECTORS(id_buf);
522 geometry->TotalCylinders = CUR_CYLS(id_buf);
523
524 } else if (ATA_HEADS(id_buf) > 0 && ATA_CYLS(id_buf) > 0 &&
525 ATA_SECTORS(id_buf) > 0) {
526 /* ATA-supplied values for geometry look valid */
527 geometry->NumHeads = ATA_HEADS(id_buf);
528 geometry->SectorsPerTrack = ATA_SECTORS(id_buf);
529 geometry->TotalCylinders = ATA_CYLS(id_buf);
530
531 } else {
532 /* use typical SCSI geometry */
533 geometry->NumHeads = 255;
534 geometry->SectorsPerTrack = 63;
535 geometry->TotalCylinders = geometry->TotalSectors /
536 ((u32) geometry->NumHeads *
537 (u32) geometry->SectorsPerTrack);
538 }
539
540 if (debug) {
541 printf("geometry information:\n");
542 printf(" heads: %d\n", (u16) geometry->NumHeads);
543 printf(" sectors: %d\n", (u16) geometry->SectorsPerTrack);
544 printf(" cylinders: %d\n", (u16) geometry->TotalCylinders);
545 printf(" capacity: %ldMB\n", (u32) (geometry->TotalSectors / 2048));
546 }
547
548 /* tell interrupt handler that this IORB is complete */
549 add_workspace(iorb)->complete = 1;
550}
551
552/******************************************************************************
553 * Test whether unit is ready.
554 */
555int ata_unit_ready(IORBH _far *iorb, int slot)
556{
557 /* This is a NOP for ATA devices (at least right now); returning an error
558 * without setting an error code means ahci_exec_iorb() will not queue any
559 * HW command and the IORB will complete successfully.
560 */
561 ((IORB_UNIT_STATUS _far *) iorb)->UnitStatus = US_READY | US_POWER;
562 return(-1);
563}
564
565/******************************************************************************
566 * Read sectors from AHCI device.
567 */
568int ata_read(IORBH _far *iorb, int slot)
569{
570 IORB_EXECUTEIO _far *io = (IORB_EXECUTEIO _far *) iorb;
571 AD_INFO *ai = ad_infos + iorb_unit_adapter(iorb);
572 ULONG sector = io->RBA + io->BlocksXferred;
573 USHORT count = io->BlockCount - io->BlocksXferred;
574 USHORT sg_indx;
575 USHORT sg_cnt;
576 int p = iorb_unit_port(iorb);
577 int d = iorb_unit_device(iorb);
578 int rc;
579
580 if (io->BlockCount == 0) {
581 /* NOP; return -1 without error in IORB to indicate success */
582 return(-1);
583 }
584
585 if (add_workspace(iorb)->unaligned) {
586 /* unaligned S/G addresses present; need to use double buffers */
587 return(ata_read_unaligned(iorb, slot));
588 }
589
590 /* Kludge: some I/O commands during boot use excessive S/G buffer lengths
591 * which cause NCQ commands to lock up. If there's only one S/G element
592 * and this element is already larger than what we can derive from the sector
593 * count, we'll adjust that element.
594 */
595 if (io->BlocksXferred == 0 && io->cSGList == 1 &&
596 io->pSGList[0].XferBufLen > (ULONG) io->BlockCount * io->BlockSize) {
597 io->pSGList[0].XferBufLen = (ULONG) io->BlockCount * io->BlockSize;
598 }
599
600 /* prepare read command while keeping an eye on S/G count limitations */
601 do {
602 sg_indx = ata_get_sg_indx(io);
603 sg_cnt = io->cSGList - sg_indx;
604 if ((rc = ata_cmd_read(iorb, ai, p, d, slot, sector, count,
605 io->pSGList + sg_indx, sg_cnt)) > 0) {
606 /* couldn't map all S/G elements */
607 ata_max_sg_cnt(io, sg_indx, (USHORT) rc, &sg_cnt, &count);
608 }
609 } while (rc > 0 && sg_cnt > 0);
610
611 if (rc == 0) {
612 add_workspace(iorb)->blocks = count;
613 add_workspace(iorb)->ppfunc = ata_read_pp;
614
615 } else if (rc > 0) {
616 iorb_seterr(iorb, IOERR_CMD_SGLIST_BAD);
617
618 } else if (rc == ATA_CMD_UNALIGNED_ADDR) {
619 /* unaligned S/G addresses detected; need to use double buffers */
620 add_workspace(iorb)->unaligned = 1;
621 return(ata_read_unaligned(iorb, slot));
622
623 } else {
624 iorb_seterr(iorb, IOERR_CMD_ADD_SOFTWARE_FAILURE);
625 }
626
627 return(rc);
628}
629
630/******************************************************************************
631 * Read sectors from AHCI device with unaligned S/G element addresses. AHCI
632 * only allows aligned S/G addresses while OS/2 doesn't have these kind of
633 * restrictions. This doesn't happen very often but when it does, we need to
634 * use a transfer buffer and copy the data manually.
635 */
636int ata_read_unaligned(IORBH _far *iorb, int slot)
637{
638 IORB_EXECUTEIO _far *io = (IORB_EXECUTEIO _far *) iorb;
639 ADD_WORKSPACE _far *aws = add_workspace(iorb);
640 AD_INFO *ai = ad_infos + iorb_unit_adapter(iorb);
641 ULONG sector = io->RBA + io->BlocksXferred;
642 SCATGATENTRY sg_single;
643 int p = iorb_unit_port(iorb);
644 int d = iorb_unit_device(iorb);
645 int rc;
646
647 ddprintf("ata_read_unaligned(%d.%d.%d, %ld)\n", ad_no(ai), p, d, sector);
648
649 /* allocate transfer buffer */
650 if ((aws->buf = malloc(io->BlockSize)) == NULL) {
651 iorb_seterr(iorb, IOERR_CMD_SW_RESOURCE);
652 return(-1);
653 }
654
655 /* prepare read command using transfer buffer */
656 sg_single.ppXferBuf = virt_to_phys(aws->buf);
657 sg_single.XferBufLen = io->BlockSize;
658 rc = ata_cmd_read(iorb, ai, p, d, slot, sector, 1, &sg_single, 1);
659
660 if (rc == 0) {
661 add_workspace(iorb)->blocks = 1;
662 add_workspace(iorb)->ppfunc = ata_read_pp;
663
664 } else if (rc > 0) {
665 iorb_seterr(iorb, IOERR_CMD_SGLIST_BAD);
666
667 } else {
668 iorb_seterr(iorb, IOERR_CMD_ADD_SOFTWARE_FAILURE);
669 }
670
671 return(rc);
672}
673
674/******************************************************************************
675 * Post processing function for ata_read(); this function updates the
676 * BlocksXferred counter in the IORB and, if not all blocks have been
677 * transferred, requeues the IORB to process the remaining sectors. It also
678 * takes care of copying data from the transfer buffer for unaligned reads.
679 */
680void ata_read_pp(IORBH _far *iorb)
681{
682 IORB_EXECUTEIO _far *io = (IORB_EXECUTEIO _far *) iorb;
683 ADD_WORKSPACE _far *aws = add_workspace(iorb);
684
685 if (aws->unaligned) {
686 /* copy transfer buffer to corresponding physical address in S/G list */
687 sg_memcpy(io->pSGList, io->cSGList,
688 (ULONG) io->BlocksXferred * (ULONG) io->BlockSize,
689 aws->buf, io->BlockSize, BUF_TO_SG);
690 }
691
692 io->BlocksXferred += add_workspace(iorb)->blocks;
693 dprintf("ata_read_pp(): blocks transferred = %d\n", (int) io->BlocksXferred);
694
695 if (io->BlocksXferred >= io->BlockCount) {
696 /* we're done; tell IRQ handler the IORB is complete */
697 add_workspace(iorb)->complete = 1;
698 } else {
699 /* requeue this IORB for next iteration */
700 iorb_requeue(iorb);
701 }
702}
703
704/******************************************************************************
705 * Verify readability of sectors on ATA device.
706 */
707int ata_verify(IORBH _far *iorb, int slot)
708{
709 IORB_EXECUTEIO _far *io = (IORB_EXECUTEIO _far *) iorb;
710 AD_INFO *ai = ad_infos + iorb_unit_adapter(iorb);
711 int p = iorb_unit_port(iorb);
712 int d = iorb_unit_device(iorb);
713 int rc;
714
715 if (io->BlockCount == 0) {
716 /* NOP; return -1 without error in IORB to indicate success */
717 return(-1);
718 }
719
720 /* prepare verify command */
721 if (io->RBA >= (1UL << 28) || io->BlockCount > 256) {
722 /* need LBA48 for this command */
723 if (!ai->ports[p].devs[d].lba48) {
724 iorb_seterr(iorb, IOERR_RBA_LIMIT);
725 return(-1);
726 }
727 rc = ata_cmd(ai, p, d, slot, ATA_CMD_VERIFY_EXT,
728 AP_SECTOR_48, (u32) io->RBA, (u16) 0,
729 AP_COUNT, (u16) io->BlockCount,
730 AP_DEVICE, 0x40,
731 AP_END);
732 } else {
733 rc = ata_cmd(ai, p, d, slot, ATA_CMD_VERIFY,
734 AP_SECTOR_28, (u32) io->RBA,
735 AP_COUNT, (u16) io->BlockCount & 0xffU,
736 AP_END);
737 }
738
739 return(rc);
740}
741
742/******************************************************************************
743 * Write sectors to AHCI device.
744 */
745int ata_write(IORBH _far *iorb, int slot)
746{
747 IORB_EXECUTEIO _far *io = (IORB_EXECUTEIO _far *) iorb;
748 AD_INFO *ai = ad_infos + iorb_unit_adapter(iorb);
749 ULONG sector = io->RBA + io->BlocksXferred;
750 USHORT count = io->BlockCount - io->BlocksXferred;
751 USHORT sg_indx;
752 USHORT sg_cnt;
753 int p = iorb_unit_port(iorb);
754 int d = iorb_unit_device(iorb);
755 int rc;
756
757 if (io->BlockCount == 0) {
758 /* NOP; return -1 without error in IORB to indicate success */
759 return(-1);
760 }
761
762 if (add_workspace(iorb)->unaligned) {
763 /* unaligned S/G addresses present; need to use double buffers */
764 return(ata_write_unaligned(iorb, slot));
765 }
766
767 /* prepare write command while keeping an eye on S/G count limitations */
768 do {
769 sg_indx = ata_get_sg_indx(io);
770 sg_cnt = io->cSGList - sg_indx;
771 if ((rc = ata_cmd_write(iorb, ai, p, d, slot, sector, count,
772 io->pSGList + sg_indx, sg_cnt,
773 io->Flags & XIO_DISABLE_HW_WRITE_CACHE)) > 0) {
774 /* couldn't map all S/G elements */
775 ata_max_sg_cnt(io, sg_indx, (USHORT) rc, &sg_cnt, &count);
776 }
777 } while (rc > 0 && sg_cnt > 0);
778
779 if (rc == 0) {
780 add_workspace(iorb)->blocks = count;
781 add_workspace(iorb)->ppfunc = ata_write_pp;
782
783 } else if (rc > 0) {
784 iorb_seterr(iorb, IOERR_CMD_SGLIST_BAD);
785
786 } else if (rc == ATA_CMD_UNALIGNED_ADDR) {
787 /* unaligned S/G addresses detected; need to use double buffers */
788 add_workspace(iorb)->unaligned = 1;
789 return(ata_write_unaligned(iorb, slot));
790
791 } else {
792 iorb_seterr(iorb, IOERR_CMD_ADD_SOFTWARE_FAILURE);
793 }
794
795 return(rc);
796}
797
798/******************************************************************************
799 * Write sectors from AHCI device with unaligned S/G element addresses. AHCI
800 * only allows aligned S/G addresses while OS/2 doesn't have these kind of
801 * restrictions. This doesn't happen very often but when it does, we need to
802 * use a transfer buffer and copy the data manually.
803 */
804int ata_write_unaligned(IORBH _far *iorb, int slot)
805{
806 IORB_EXECUTEIO _far *io = (IORB_EXECUTEIO _far *) iorb;
807 ADD_WORKSPACE _far *aws = add_workspace(iorb);
808 AD_INFO *ai = ad_infos + iorb_unit_adapter(iorb);
809 ULONG sector = io->RBA + io->BlocksXferred;
810 SCATGATENTRY sg_single;
811 int p = iorb_unit_port(iorb);
812 int d = iorb_unit_device(iorb);
813 int rc;
814
815 ddprintf("ata_write_unaligned(%d.%d.%d, %ld)\n", ad_no(ai), p, d, sector);
816
817 /* allocate transfer buffer */
818 if ((aws->buf = malloc(io->BlockSize)) == NULL) {
819 iorb_seterr(iorb, IOERR_CMD_SW_RESOURCE);
820 return(-1);
821 }
822
823 /* copy next sector from S/G list to transfer buffer */
824 sg_memcpy(io->pSGList, io->cSGList,
825 (ULONG) io->BlocksXferred * (ULONG) io->BlockSize,
826 aws->buf, io->BlockSize, SG_TO_BUF);
827
828 /* prepare write command using transfer buffer */
829 sg_single.ppXferBuf = virt_to_phys(aws->buf);
830 sg_single.XferBufLen = io->BlockSize;
831 rc = ata_cmd_write(iorb, ai, p, d, slot, sector, 1, &sg_single, 1,
832 io->Flags & XIO_DISABLE_HW_WRITE_CACHE);
833
834 if (rc == 0) {
835 add_workspace(iorb)->blocks = 1;
836 add_workspace(iorb)->ppfunc = ata_write_pp;
837
838 } else if (rc > 0) {
839 iorb_seterr(iorb, IOERR_CMD_SGLIST_BAD);
840
841 } else {
842 iorb_seterr(iorb, IOERR_CMD_ADD_SOFTWARE_FAILURE);
843 }
844
845 return(rc);
846}
847
848
849/******************************************************************************
850 * Post processing function for ata_write(); this function updates the
851 * BlocksXferred counter in the IORB and, if not all blocks have been
852 * transferred, requeues the IORB to process the remaining sectors.
853 */
854void ata_write_pp(IORBH _far *iorb)
855{
856 IORB_EXECUTEIO _far *io = (IORB_EXECUTEIO _far *) iorb;
857
858 io->BlocksXferred += add_workspace(iorb)->blocks;
859 dprintf("ata_write_pp(): blocks transferred = %d\n", (int) io->BlocksXferred);
860
861 if (io->BlocksXferred >= io->BlockCount) {
862 /* we're done; tell IRQ handler the IORB is complete */
863 add_workspace(iorb)->complete = 1;
864 } else {
865 /* requeue this IORB for next iteration */
866 iorb_requeue(iorb);
867 }
868}
869
870/******************************************************************************
871 * Execute ATA command.
872 */
873int ata_execute_ata(IORBH _far *iorb, int slot)
874{
875 IORB_ADAPTER_PASSTHRU _far *apt = (IORB_ADAPTER_PASSTHRU _far *) iorb;
876 AD_INFO *ai = ad_infos + iorb_unit_adapter(iorb);
877 int p = iorb_unit_port(iorb);
878 int d = iorb_unit_device(iorb);
879 int rc;
880
881 if (apt->ControllerCmdLen != sizeof(ATA_CMD)) {
882 iorb_seterr(iorb, IOERR_CMD_SYNTAX);
883 return(-1);
884 }
885
886 rc = ata_cmd(ai, p, d, slot, 0,
887 AP_SGLIST, apt->pSGList, apt->cSGList,
888 AP_ATA_CMD, apt->pControllerCmd,
889 AP_WRITE, !(apt->Flags & PT_DIRECTION_IN),
890 AP_END);
891
892 if (rc == 0) {
893 add_workspace(iorb)->ppfunc = ata_execute_ata_pp;
894 }
895
896 return(rc);
897}
898
899/******************************************************************************
900 * Post processing function for ata_execute_ata(); the main purpose of this
901 * function is to copy the received D2H FIS (i.e. the device registers after
902 * command completion) back to the ATA command structure.
903 *
904 * See ata_cmd_to_fis() for an explanation of the mapping.
905 */
906void ata_execute_ata_pp(IORBH _far *iorb)
907{
908 AHCI_PORT_DMA _far *dma_base;
909 ATA_CMD _far *cmd;
910 AD_INFO *ai;
911 u8 _far *fis;
912 int p;
913
914 /* get address of D2H FIS */
915 ai = ad_infos + iorb_unit_adapter(iorb);
916 p = iorb_unit_port(iorb);
917 dma_base = port_dma_base(ai, p);
918 fis = dma_base->rx_fis + 0x40;
919
920 if (fis[0] != 0x34) {
921 /* this is not a D2H FIS - give up silently */
922 ddprintf("ata_execute_ata_pp(): D2H FIS type incorrect: %d\n", fis[0]);
923 add_workspace(iorb)->complete = 1;
924 return;
925 }
926
927 /* map D2H FIS to the original ATA controller command structure */
928 cmd = (ATA_CMD _far *) ((IORB_ADAPTER_PASSTHRU _far *) iorb)->pControllerCmd;
929
930 cmd->cmd = fis[2];
931 cmd->device = fis[7];
932 cmd->features = ((u16) fis[3])
933 | ((u16) fis[11]);
934 cmd->lba_l = ((u32) fis[4])
935 | ((u32) fis[5] << 8)
936 | ((u32) fis[6] << 16)
937 | ((u32) fis[8] << 24);
938 cmd->lba_h = ((u16) fis[9])
939 | ((u16) fis[10] << 8);
940 cmd->count = ((u16) fis[12])
941 | ((u16) fis[13] << 8);
942
943 dphex(cmd, sizeof(*cmd), "ahci_execute_ata_pp(): cmd after completion:\n");
944
945 /* signal completion to interrupt handler */
946 add_workspace(iorb)->complete = 1;
947}
948
949/******************************************************************************
950 * Request sense information for a failed command. Since there is no "request
951 * sense" command for ATA devices, we need to read the current error code from
952 * the AHCI task file register and fabricate the sense information.
953 *
954 * NOTES:
955 *
956 * - This function must be called right after an ATA command has failed and
957 * before any other commands are queued on the corresponding port. This
958 * function is typically called in the port restart context hook which is
959 * triggered by an AHCI error interrupt.
960 *
961 * - The ATA error bits are a complete mess. We'll try and catch the most
962 * interesting error codes (such as medium errors) and report everything
963 * else with a generic error code.
964 */
965int ata_req_sense(IORBH _far *iorb, int slot)
966{
967 AD_INFO *ai = ad_infos + iorb_unit_adapter(iorb);
968 u8 _far *port_mmio = port_base(ai, iorb_unit_port(iorb));
969 u32 tf_data = readl(port_mmio + PORT_TFDATA);
970 u8 err = (u8) (tf_data >> 8);
971 u8 sts = (u8) (tf_data);
972
973 if (sts & ATA_ERR) {
974 if (sts & ATA_DF) {
975 /* there is a device-specific error condition */
976 if (err & ATA_ICRC) {
977 iorb_seterr(iorb, IOERR_ADAPTER_DEVICEBUSCHECK);
978 } else if (err & ATA_UNC) {
979 iorb_seterr(iorb, IOERR_MEDIA);
980 } else if (err & ATA_IDNF) {
981 iorb_seterr(iorb, IOERR_RBA_ADDRESSING_ERROR);
982 } else {
983 iorb_seterr(iorb, IOERR_DEVICE_NONSPECIFIC);
984 }
985
986 } else {
987 iorb_seterr(iorb, IOERR_DEVICE_NONSPECIFIC);
988 }
989 } else {
990 /* this function only gets called when we received an error interrupt */
991 iorb_seterr(iorb, IOERR_DEVICE_NONSPECIFIC);
992 }
993
994 /* Return an error to indicate there's no HW command to be submitted and
995 * that the IORB can be completed "as is" (the upstream code expects the
996 * IORB error code, if any, to be set when this happens and this is exactly
997 * what this function is all about).
998 */
999 return(-1);
1000}
1001
1002/******************************************************************************
1003 * Extract vendor and device name from an ATA INDENTIFY buffer. Since strings
1004 * in the indentify buffer are byte-swapped, we need to swap them back.
1005 */
1006char *ata_dev_name(u16 *id_buf)
1007{
1008 static char dev_name[ATA_ID_PROD_LEN + 1];
1009 char *t = dev_name;
1010 char *s = (char *) (id_buf + ATA_ID_PROD);
1011 int i;
1012
1013 dev_name[sizeof(dev_name)-1] = '\0';
1014
1015 for (i = 0; i < ATA_ID_PROD_LEN / 2; i++) {
1016 *(t++) = s[1];
1017 *(t++) = s[0];
1018 s += 2;
1019 }
1020
1021 return(dev_name);
1022}
1023
1024/******************************************************************************
1025 * Fabricate ATA READ command based on the capabilities of the corresponding
1026 * device and the paramters set from above (NCQ, etc).
1027 */
1028static int ata_cmd_read(IORBH _far *iorb, AD_INFO *ai, int p, int d, int slot,
1029 ULONG sector, ULONG count, SCATGATENTRY _far *sg_list,
1030 ULONG sg_cnt)
1031{
1032 int rc;
1033
1034 if (sector >= (1UL << 28) || count > 256 || add_workspace(iorb)->is_ncq) {
1035 /* need LBA48 for this command */
1036 if (!ai->ports[p].devs[d].lba48) {
1037 iorb_seterr(iorb, IOERR_RBA_LIMIT);
1038 return(-1);
1039 }
1040 if (add_workspace(iorb)->is_ncq) {
1041 /* use NCQ read; count goes into feature register, tag into count! */
1042 rc = ata_cmd(ai, p, d, slot, ATA_CMD_FPDMA_READ,
1043 AP_SECTOR_48, (u32) sector, (u16) 0,
1044 AP_FEATURES, (u16) count,
1045 AP_COUNT, (u16) (slot << 3), /* tag == slot */
1046 AP_SGLIST, sg_list, (u16) sg_cnt,
1047 AP_DEVICE, 0x40,
1048 AP_END);
1049 } else {
1050 rc = ata_cmd(ai, p, d, slot, ATA_CMD_READ_EXT,
1051 AP_SECTOR_48, (u32) sector, (u16) 0,
1052 AP_COUNT, (u16) count,
1053 AP_SGLIST, sg_list, (u16) sg_cnt,
1054 AP_DEVICE, 0x40,
1055 AP_END);
1056 }
1057
1058 } else {
1059 rc = ata_cmd(ai, p, d, slot, ATA_CMD_READ,
1060 AP_SECTOR_28, (u32) sector,
1061 AP_COUNT, (u16) count & 0xffU,
1062 AP_SGLIST, sg_list, (u16) sg_cnt,
1063 AP_DEVICE, 0x40,
1064 AP_END);
1065 }
1066
1067 return(rc);
1068}
1069
1070/******************************************************************************
1071 * Fabricate ATA WRITE command based on the capabilities of the corresponding
1072 * device and the paramters set from above (NCQ, etc)
1073 */
1074static int ata_cmd_write(IORBH _far *iorb, AD_INFO *ai, int p, int d, int slot,
1075 ULONG sector, ULONG count, SCATGATENTRY _far *sg_list,
1076 ULONG sg_cnt, int write_through)
1077{
1078 int rc;
1079
1080 if (sector >= (1UL << 28) || count > 256 || add_workspace(iorb)->is_ncq) {
1081 /* need LBA48 for this command */
1082 if (!ai->ports[p].devs[d].lba48) {
1083 iorb_seterr(iorb, IOERR_RBA_LIMIT);
1084 return(-1);
1085 }
1086 if (add_workspace(iorb)->is_ncq) {
1087 /* use NCQ write; count goes into feature register, tag into count! */
1088 rc = ata_cmd(ai, p, d, slot, ATA_CMD_FPDMA_WRITE,
1089 AP_SECTOR_48, (u32) sector, (u16) 0,
1090 AP_FEATURES, (u16) count,
1091 /* tag = slot */
1092 AP_COUNT, (u16) (slot << 3),
1093 AP_SGLIST, sg_list, (u16) sg_cnt,
1094 AP_DEVICE, 0x40,
1095 /* force unit access */
1096 AP_DEVICE, (write_through && !force_write_cache) ? 0x80 : 0,
1097 AP_WRITE, 1,
1098 AP_END);
1099 } else {
1100 rc = ata_cmd(ai, p, d, slot, ATA_CMD_WRITE_EXT,
1101 AP_SECTOR_48, (u32) sector, (u16) 0,
1102 AP_COUNT, (u16) count,
1103 AP_SGLIST, sg_list, (u16) sg_cnt,
1104 AP_DEVICE, 0x40,
1105 AP_WRITE, 1,
1106 AP_END);
1107 }
1108
1109 } else {
1110 rc = ata_cmd(ai, p, d, slot, ATA_CMD_WRITE,
1111 AP_SECTOR_28, (u32) sector,
1112 AP_COUNT, (u16) count & 0xffU,
1113 AP_SGLIST, sg_list, (u16) sg_cnt,
1114 AP_DEVICE, 0x40,
1115 AP_WRITE, 1,
1116 AP_END);
1117 }
1118
1119 return(rc);
1120}
Note: See TracBrowser for help on using the repository browser.