VirtualBox

source: vbox/trunk/src/VBox/Devices/PC/BIOS-new/MakeDebianBiosAssembly.cpp@ 41508

Last change on this file since 41508 was 41508, checked in by vboxsync, 13 years ago

Not needed either.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 52.8 KB
Line 
1/* $Id: MakeDebianBiosAssembly.cpp 41508 2012-05-30 19:30:54Z vboxsync $ */
2/** @file
3 * MakeDebianBiosAssembly - Generate Assembly Source for Debian-minded Distros.
4 */
5
6/*
7 * Copyright (C) 2012 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*******************************************************************************
20* Header Files *
21*******************************************************************************/
22#include <iprt/asm.h>
23#include <iprt/buildconfig.h>
24#include <iprt/ctype.h>
25#include <iprt/dbg.h>
26#include <iprt/file.h>
27#include <iprt/getopt.h>
28#include <iprt/initterm.h>
29#include <iprt/mem.h>
30#include <iprt/message.h>
31#include <iprt/string.h>
32#include <iprt/stream.h>
33#include <iprt/x86.h>
34
35#include <VBox/dis.h>
36
37
38/*******************************************************************************
39* Defined Constants And Macros *
40*******************************************************************************/
41/** The flat ROM base address. */
42#define VBOX_BIOS_BASE UINT32_C(0xf0000)
43
44
45/*******************************************************************************
46* Structures and Typedefs *
47*******************************************************************************/
48/**
49 * A BIOS segment.
50 */
51typedef struct BIOSSEG
52{
53 char szName[32];
54 char szClass[32];
55 char szGroup[32];
56 RTFAR16 Address;
57 uint32_t uFlatAddr;
58 uint32_t cb;
59} BIOSSEG;
60/** Pointer to a BIOS segment. */
61typedef BIOSSEG *PBIOSSEG;
62
63
64/**
65 * Pointer to a BIOS map parser handle.
66 */
67typedef struct BIOSMAP
68{
69 /** The stream pointer. */
70 PRTSTREAM hStrm;
71 /** The file name. */
72 const char *pszMapFile;
73 /** Set when EOF has been reached. */
74 bool fEof;
75 /** The current line number (0 based).*/
76 uint32_t iLine;
77 /** The length of the current line. */
78 uint32_t cch;
79 /** The offset of the first non-white character on the line. */
80 uint32_t offNW;
81 /** The line buffer. */
82 char szLine[16384];
83} BIOSMAP;
84/** Pointer to a BIOS map parser handle. */
85typedef BIOSMAP *PBIOSMAP;
86
87
88/*******************************************************************************
89* Global Variables *
90*******************************************************************************/
91static unsigned g_cVerbose = 1 /*0*/;
92/** Pointer to the BIOS image. */
93static uint8_t const *g_pbImg;
94/** The size of the BIOS image. */
95static size_t g_cbImg;
96
97/** Debug module for the map file. */
98static RTDBGMOD g_hMapMod = NIL_RTDBGMOD;
99/** The number of BIOS segments found in the map file. */
100static uint32_t g_cSegs = 0;
101/** Array of BIOS segments from the map file. */
102static BIOSSEG g_aSegs[32];
103
104/** The output stream. */
105static PRTSTREAM g_hStrmOutput = NULL;
106
107
108static bool outputPrintfV(const char *pszFormat, va_list va)
109{
110 int rc = RTStrmPrintfV(g_hStrmOutput, pszFormat, va);
111 if (RT_FAILURE(rc))
112 {
113 RTMsgError("Output error: %Rrc\n", rc);
114 return false;
115 }
116 return true;
117}
118
119
120static bool outputPrintf(const char *pszFormat, ...)
121{
122 va_list va;
123 va_start(va, pszFormat);
124 bool fRc = outputPrintfV(pszFormat, va);
125 va_end(va);
126 return fRc;
127}
128
129
130/**
131 * Opens the output file for writing.
132 *
133 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
134 * @param pszOutput Path to the output file.
135 */
136static RTEXITCODE OpenOutputFile(const char *pszOutput)
137{
138 if (!pszOutput)
139 g_hStrmOutput = g_pStdOut;
140 else
141 {
142 int rc = RTStrmOpen(pszOutput, "w", &g_hStrmOutput);
143 if (RT_FAILURE(rc))
144 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Failed to open output file '%s': %Rrc", pszOutput, rc);
145 }
146 return RTEXITCODE_SUCCESS;
147}
148
149
150/**
151 * Displays a disassembly error and returns @c false.
152 *
153 * @returns @c false.
154 * @param pszFormat The error format string.
155 * @param ... Format argument.
156 */
157static bool disError(const char *pszFormat, ...)
158{
159 va_list va;
160 va_start(va, pszFormat);
161 RTMsgErrorV(pszFormat, va);
162 va_end(va);
163 return false;
164}
165
166
167/**
168 * Output the disassembly file header.
169 *
170 * @returns @c true on success,
171 */
172static bool disFileHeader(void)
173{
174 return outputPrintf("; $Id: MakeDebianBiosAssembly.cpp 41508 2012-05-30 19:30:54Z vboxsync $ \n"
175 ";; @file\n"
176 "; Auto Generated source file. Do not edit.\n"
177 ";\n"
178 "\n"
179 "org 0xf000\n"
180 "\n"
181 );
182}
183
184
185/**
186 * Checks if a byte sequence could be a string litteral.
187 *
188 * @returns @c true if it is, @c false if it isn't.
189 * @param uFlatAddr The address of the byte sequence.
190 * @param cb The length of the sequence.
191 */
192static bool disIsString(uint32_t uFlatAddr, uint32_t cb)
193{
194 if (cb < 6)
195 return false;
196
197 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
198 while (cb > 0)
199 {
200 if ( !RT_C_IS_PRINT(*pb)
201 && *pb != '\r'
202 && *pb != '\n'
203 && *pb != '\t')
204 {
205 if (*pb == '\0')
206 {
207 do
208 {
209 pb++;
210 cb--;
211 } while (cb > 0 && *pb == '\0');
212 return cb == 0;
213 }
214 return false;
215 }
216 pb++;
217 cb--;
218 }
219
220 return true;
221}
222
223
224/**
225 * Checks if a dword could be a far 16:16 BIOS address.
226 *
227 * @returns @c true if it is, @c false if it isn't.
228 * @param uFlatAddr The address of the dword.
229 */
230static bool disIsFarBiosAddr(uint32_t uFlatAddr)
231{
232 uint16_t const *pu16 = (uint16_t const *)&g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
233 if (pu16[1] < 0xf000)
234 return false;
235 if (pu16[1] > 0xfff0)
236 return false;
237 uint32_t uFlatAddr2 = (uint32_t)(pu16[1] << 4) | pu16[0];
238 if (uFlatAddr2 >= VBOX_BIOS_BASE + _64K)
239 return false;
240 return true;
241}
242
243
244static bool disByteData(uint32_t uFlatAddr, uint32_t cb)
245{
246 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
247 size_t cbOnLine = 0;
248 while (cb-- > 0)
249 {
250 bool fRc;
251 if (cbOnLine >= 16)
252 {
253 fRc = outputPrintf("\n"
254 " db 0%02xh", *pb);
255 cbOnLine = 1;
256 }
257 else if (!cbOnLine)
258 {
259 fRc = outputPrintf(" db 0%02xh", *pb);
260 cbOnLine = 1;
261 }
262 else
263 {
264 fRc = outputPrintf(", 0%02xh", *pb);
265 cbOnLine++;
266 }
267 if (!fRc)
268 return false;
269 pb++;
270 }
271 return outputPrintf("\n");
272}
273
274
275static bool disWordData(uint32_t uFlatAddr, uint32_t cb)
276{
277 if (cb & 1)
278 return disError("disWordData expects word aligned size: cb=%#x uFlatAddr=%#x", uFlatAddr, cb);
279
280 uint16_t const *pu16 = (uint16_t const *)&g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
281 size_t cbOnLine = 0;
282 while (cb > 0)
283 {
284 bool fRc;
285 if (cbOnLine >= 16)
286 {
287 fRc = outputPrintf("\n"
288 " dw 0%04xh", *pu16);
289 cbOnLine = 2;
290 }
291 else if (!cbOnLine)
292 {
293 fRc = outputPrintf(" dw 0%04xh", *pu16);
294 cbOnLine = 2;
295 }
296 else
297 {
298 fRc = outputPrintf(", 0%04xh", *pu16);
299 cbOnLine += 2;
300 }
301 if (!fRc)
302 return false;
303 pu16++;
304 cb -= 2;
305 }
306 return outputPrintf("\n");
307}
308
309
310static bool disDWordData(uint32_t uFlatAddr, uint32_t cb)
311{
312 if (cb & 3)
313 return disError("disWordData expects dword aligned size: cb=%#x uFlatAddr=%#x", uFlatAddr, cb);
314
315 uint32_t const *pu32 = (uint32_t const *)&g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
316 size_t cbOnLine = 0;
317 while (cb > 0)
318 {
319 bool fRc;
320 if (cbOnLine >= 16)
321 {
322 fRc = outputPrintf("\n"
323 " dd 0%08xh", *pu32);
324 cbOnLine = 4;
325 }
326 else if (!cbOnLine)
327 {
328 fRc = outputPrintf(" dd 0%08xh", *pu32);
329 cbOnLine = 4;
330 }
331 else
332 {
333 fRc = outputPrintf(", 0%08xh", *pu32);
334 cbOnLine += 4;
335 }
336 if (!fRc)
337 return false;
338 pu32++;
339 cb -= 4;
340 }
341 return outputPrintf("\n");
342}
343
344
345static bool disStringData(uint32_t uFlatAddr, uint32_t cb)
346{
347 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
348 uint32_t cchOnLine = 0;
349 while (cb > 0)
350 {
351 /* Line endings and beginnings. */
352 if (cchOnLine >= 72)
353 {
354 if (!outputPrintf("\n"))
355 return false;
356 cchOnLine = 0;
357 }
358 if ( !cchOnLine
359 && !outputPrintf(" db "))
360 return false;
361
362 /* See how many printable character we've got. */
363 uint32_t cchPrintable = 0;
364 while ( cchPrintable < cb
365 && RT_C_IS_PRINT(pb[cchPrintable])
366 && pb[cchPrintable] != '\'')
367 cchPrintable++;
368
369 bool fRc = true;
370 if (cchPrintable)
371 {
372 if (cchPrintable + cchOnLine > 72)
373 cchPrintable = 72 - cchOnLine;
374 if (cchOnLine)
375 {
376 fRc = outputPrintf(", '%.*s'", cchPrintable, pb);
377 cchOnLine += 4 + cchPrintable;
378 }
379 else
380 {
381 fRc = outputPrintf("'%.*s'", cchPrintable, pb);
382 cchOnLine += 2 + cchPrintable;
383 }
384 pb += cchPrintable;
385 cb -= cchPrintable;
386 }
387 else
388 {
389 if (cchOnLine)
390 {
391 fRc = outputPrintf(", 0%02xh", *pb);
392 cchOnLine += 6;
393 }
394 else
395 {
396 fRc = outputPrintf("0%02xh", *pb);
397 cchOnLine += 4;
398 }
399 pb++;
400 cb--;
401 }
402 if (!fRc)
403 return false;
404 }
405 return outputPrintf("\n");
406}
407
408
409/**
410 * For dumping a portion of a string table.
411 *
412 * @returns @c true on success, @c false on failure.
413 * @param uFlatAddr The start address.
414 * @param cb The size of the string table.
415 */
416static bool disStringsData(uint32_t uFlatAddr, uint32_t cb)
417{
418 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
419 uint32_t cchOnLine = 0;
420 uint8_t bPrev = 255;
421 while (cb > 0)
422 {
423 /* Line endings and beginnings. */
424 if ( cchOnLine >= 72
425 || (bPrev == '\0' && *pb != '\0'))
426 {
427 if (!outputPrintf("\n"))
428 return false;
429 cchOnLine = 0;
430 }
431 if ( !cchOnLine
432 && !outputPrintf(" db "))
433 return false;
434
435 /* See how many printable character we've got. */
436 uint32_t cchPrintable = 0;
437 while ( cchPrintable < cb
438 && RT_C_IS_PRINT(pb[cchPrintable])
439 && pb[cchPrintable] != '\'')
440 cchPrintable++;
441
442 bool fRc = true;
443 if (cchPrintable)
444 {
445 if (cchPrintable + cchOnLine > 72)
446 cchPrintable = 72 - cchOnLine;
447 if (cchOnLine)
448 {
449 fRc = outputPrintf(", '%.*s'", cchPrintable, pb);
450 cchOnLine += 4 + cchPrintable;
451 }
452 else
453 {
454 fRc = outputPrintf("'%.*s'", cchPrintable, pb);
455 cchOnLine += 2 + cchPrintable;
456 }
457 pb += cchPrintable;
458 cb -= cchPrintable;
459 }
460 else
461 {
462 if (cchOnLine)
463 {
464 fRc = outputPrintf(", 0%02xh", *pb);
465 cchOnLine += 6;
466 }
467 else
468 {
469 fRc = outputPrintf("0%02xh", *pb);
470 cchOnLine += 4;
471 }
472 pb++;
473 cb--;
474 }
475 if (!fRc)
476 return false;
477 bPrev = pb[-1];
478 }
479 return outputPrintf("\n");
480}
481
482
483/**
484 * Minds the gap between two segments.
485 *
486 * Gaps should generally be zero filled.
487 *
488 * @returns @c true on success, @c false on failure.
489 * @param uFlatAddr The address of the gap.
490 * @param cbPadding The size of the gap.
491 */
492static bool disCopySegmentGap(uint32_t uFlatAddr, uint32_t cbPadding)
493{
494 if (g_cVerbose > 0)
495 outputPrintf("\n"
496 " ; Padding %#x bytes at %#x\n", cbPadding, uFlatAddr);
497 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
498 if (!ASMMemIsAll8(pb, cbPadding, 0))
499 return outputPrintf(" times %u db 0\n", cbPadding);
500
501 return disByteData(uFlatAddr, cbPadding);
502}
503
504
505/**
506 * Worker for disGetNextSymbol that only does the looking up, no RTDBSYMBOL::cb
507 * calc.
508 *
509 * @param uFlatAddr The address to start searching at.
510 * @param cbMax The size of the search range.
511 * @param poff Where to return the offset between the symbol
512 * and @a uFlatAddr.
513 * @param pSym Where to return the symbol data.
514 */
515static void disGetNextSymbolWorker(uint32_t uFlatAddr, uint32_t cbMax, uint32_t *poff, PRTDBGSYMBOL pSym)
516{
517 RTINTPTR off = 0;
518 int rc = RTDbgModSymbolByAddr(g_hMapMod, RTDBGSEGIDX_RVA, uFlatAddr, RTDBGSYMADDR_FLAGS_GREATER_OR_EQUAL, &off, pSym);
519 if (RT_SUCCESS(rc))
520 {
521 /* negative offset, indicates beyond. */
522 if (off <= 0)
523 {
524 *poff = (uint32_t)-off;
525 return;
526 }
527
528 outputPrintf(" ; !! RTDbgModSymbolByAddr(,,%#x,,) -> off=%RTptr cb=%RTptr uValue=%RTptr '%s'\n",
529 uFlatAddr, off, pSym->cb, pSym->Value, pSym->szName);
530 }
531 else if (rc != VERR_SYMBOL_NOT_FOUND)
532 outputPrintf(" ; !! RTDbgModSymbolByAddr(,,%#x,,) -> %Rrc\n", uFlatAddr, rc);
533
534 RTStrPrintf(pSym->szName, sizeof(pSym->szName), "_dummy_addr_%#x", uFlatAddr + cbMax);
535 pSym->Value = uFlatAddr + cbMax;
536 pSym->cb = 0;
537 pSym->offSeg = uFlatAddr + cbMax;
538 pSym->iSeg = RTDBGSEGIDX_RVA;
539 pSym->iOrdinal = 0;
540 pSym->fFlags = 0;
541 *poff = cbMax;
542}
543
544
545/**
546 * Gets the symbol at or after the given address.
547 *
548 * If there are no symbols in the specified range, @a pSym and @a poff will be
549 * set up to indicate a symbol at the first byte after the range.
550 *
551 * @param uFlatAddr The address to start searching at.
552 * @param cbMax The size of the search range.
553 * @param poff Where to return the offset between the symbol
554 * and @a uFlatAddr.
555 * @param pSym Where to return the symbol data.
556 */
557static void disGetNextSymbol(uint32_t uFlatAddr, uint32_t cbMax, uint32_t *poff, PRTDBGSYMBOL pSym)
558{
559 disGetNextSymbolWorker(uFlatAddr, cbMax, poff, pSym);
560 if ( *poff < cbMax
561 && pSym->cb == 0)
562 {
563 if (*poff + 1 < cbMax)
564 {
565 uint32_t off2;
566 RTDBGSYMBOL Sym2;
567 disGetNextSymbolWorker(uFlatAddr + *poff + 1, cbMax - *poff - 1, &off2, &Sym2);
568 pSym->cb = off2 + 1;
569 }
570 else
571 pSym->cb = 1;
572 }
573 if (pSym->cb > cbMax - *poff)
574 pSym->cb = cbMax - *poff;
575
576 if (g_cVerbose > 1)
577 outputPrintf(" ; disGetNextSymbol %#x LB %#x -> off=%#x cb=%RTptr uValue=%RTptr '%s'\n",
578 uFlatAddr, cbMax, *poff, pSym->cb, pSym->Value, pSym->szName);
579
580}
581
582
583/**
584 * For dealing with the const segment (string constants).
585 *
586 * @returns @c true on success, @c false on failure.
587 * @param iSeg The segment.
588 */
589static bool disConstSegment(uint32_t iSeg)
590{
591 uint32_t uFlatAddr = g_aSegs[iSeg].uFlatAddr;
592 uint32_t cb = g_aSegs[iSeg].cb;
593
594 while (cb > 0)
595 {
596 uint32_t off;
597 RTDBGSYMBOL Sym;
598 disGetNextSymbol(uFlatAddr, cb, &off, &Sym);
599
600 if (off > 0)
601 {
602 if (!disStringsData(uFlatAddr, off))
603 return false;
604 cb -= off;
605 uFlatAddr += off;
606 off = 0;
607 if (!cb)
608 break;
609 }
610
611 bool fRc;
612 if (off == 0)
613 {
614 size_t cchName = strlen(Sym.szName);
615 fRc = outputPrintf("%s: %*s; %#x LB %#x\n", Sym.szName, cchName < 41 - 2 ? cchName - 41 - 2 : 0, "", uFlatAddr, Sym.cb);
616 if (!fRc)
617 return false;
618 fRc = disStringsData(uFlatAddr, Sym.cb);
619 uFlatAddr += Sym.cb;
620 cb -= Sym.cb;
621 }
622 else
623 {
624 fRc = disStringsData(uFlatAddr, Sym.cb);
625 uFlatAddr += cb;
626 cb = 0;
627 }
628 if (!fRc)
629 return false;
630 }
631
632 return true;
633}
634
635
636
637static bool disDataSegment(uint32_t iSeg)
638{
639 uint32_t uFlatAddr = g_aSegs[iSeg].uFlatAddr;
640 uint32_t cb = g_aSegs[iSeg].cb;
641
642 while (cb > 0)
643 {
644 uint32_t off;
645 RTDBGSYMBOL Sym;
646 disGetNextSymbol(uFlatAddr, cb, &off, &Sym);
647
648 if (off > 0)
649 {
650 if (!disByteData(uFlatAddr, off))
651 return false;
652 cb -= off;
653 uFlatAddr += off;
654 off = 0;
655 if (!cb)
656 break;
657 }
658
659 bool fRc;
660 if (off == 0)
661 {
662 size_t cchName = strlen(Sym.szName);
663 fRc = outputPrintf("%s: %*s; %#x LB %#x\n", Sym.szName, cchName < 41 - 2 ? cchName - 41 - 2 : 0, "", uFlatAddr, Sym.cb);
664 if (!fRc)
665 return false;
666
667 if (Sym.cb == 2)
668 fRc = disWordData(uFlatAddr, 2);
669 //else if (Sym.cb == 4 && disIsFarBiosAddr(uFlatAddr))
670 // fRc = disDWordData(uFlatAddr, 4);
671 else if (Sym.cb == 4)
672 fRc = disDWordData(uFlatAddr, 4);
673 else if (disIsString(uFlatAddr, Sym.cb))
674 fRc = disStringData(uFlatAddr, Sym.cb);
675 else
676 fRc = disByteData(uFlatAddr, Sym.cb);
677
678 uFlatAddr += Sym.cb;
679 cb -= Sym.cb;
680 }
681 else
682 {
683 fRc = disByteData(uFlatAddr, cb);
684 uFlatAddr += cb;
685 cb = 0;
686 }
687 if (!fRc)
688 return false;
689 }
690
691 return true;
692}
693
694
695static bool disIsCodeAndAdjustSize(uint32_t uFlatAddr, PRTDBGSYMBOL pSym, PBIOSSEG pSeg)
696{
697 if (!strcmp(pSeg->szName, "BIOSSEG"))
698 {
699 if ( !strcmp(pSym->szName, "rom_fdpt")
700 || !strcmp(pSym->szName, "pmbios_gdt")
701 || !strcmp(pSym->szName, "pmbios_gdt_desc")
702 || !strcmp(pSym->szName, "_pmode_IDT")
703 || !strcmp(pSym->szName, "_rmode_IDT")
704 || !strncmp(pSym->szName, RT_STR_TUPLE("font"))
705 || !strcmp(pSym->szName, "bios_string")
706 || !strcmp(pSym->szName, "vector_table")
707 || !strcmp(pSym->szName, "pci_routing_table_structure")
708 )
709 return false;
710 }
711
712 if (!strcmp(pSym->szName, "cpu_reset"))
713 pSym->cb = RT_MIN(pSym->cb, 5);
714 else if (!strcmp(pSym->szName, "pci_init_end"))
715 pSym->cb = RT_MIN(pSym->cb, 3);
716
717 return true;
718}
719
720
721static bool disIs16BitCode(const char *pszSymbol)
722{
723 return true;
724}
725
726
727/**
728 * Deals with instructions that YASM will assemble differently than WASM/WCC.
729 */
730static size_t disHandleYasmDifferences(PDISCPUSTATE pCpuState, uint32_t uFlatAddr, uint32_t cbInstr,
731 char *pszBuf, size_t cbBuf, size_t cchUsed)
732{
733 bool fDifferent = DISFormatYasmIsOddEncoding(pCpuState);
734 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
735
736 /*
737 * Disassembler bugs.
738 */
739 /** @todo Group 1a and 11 seems to be disassembled incorrectly when
740 * modrm.reg != 0. Those encodings should be invalid AFAICT. */
741
742 if ( ( pCpuState->opcode == 0x8f /* group 1a */
743 || pCpuState->opcode == 0xc7 /* group 11 */
744 || pCpuState->opcode == 0xc6 /* group 11 - not verified */
745 )
746 && pCpuState->ModRM.Bits.Reg != 0)
747 fDifferent = true;
748 /** @todo "TEST Eb,Ib" (f6 0f 08) ends up with no mnemonic as well as
749 * wrong length (2 instead of 3)! */
750 else if ( pCpuState->opcode == 0xf6
751 && pb[1] == 0x0f
752 && pb[2] == 0x08
753 && RT_C_IS_SPACE(*pszBuf) )
754 fDifferent = true;
755 /** @todo "INSB Yb,DX" (6c) ends up with no mnemonic here. */
756 else if (pCpuState->opcode == 0x6c && RT_C_IS_SPACE(*pszBuf))
757 fDifferent = true;
758 /*
759 * Check these out and consider adding them to DISFormatYasmIsOddEncoding.
760 */
761 else if ( pb[0] == 0xf3
762 && pb[1] == 0x66
763 && pb[2] == 0x6d)
764 fDifferent = true; /* rep insd - prefix switched. */
765 else if ( pb[0] == 0xc6
766 && pb[1] == 0xc5
767 && pb[2] == 0xba)
768 fDifferent = true; /* mov ch, 0bah - yasm uses a short sequence: 0xb5 0xba. */
769 /*
770 * Switch table fun (.sym may help):
771 */
772#if 0
773 else if ( pb[0] == 0x64
774 && pb[1] == 0x65
775 && pb[2] == 0x05
776 /*&& pb[3] == 0x61
777 && pb[4] == 0x19*/)
778 fDifferent = true; /* gs add ax, 01961h - both fs and gs prefix. Probably some switch table. */
779 else if ( pb[0] == 0x65
780 && pb[1] == 0x36
781 && pb[2] == 0x65
782 && pb[3] == 0xae)
783 fDifferent = true; /* gs scasb - switch table or smth. */
784 else if ( pb[0] == 0x67
785 && pb[1] == 0xe7
786 /*&& pb[2] == 0x67*/)
787 fDifferent = true; /* out 067h, ax - switch table or smth. */
788#endif
789
790
791 /*
792 * Handle different stuff.
793 */
794 if (fDifferent)
795 {
796 disByteData(uFlatAddr, cbInstr); /* lazy bird. */
797
798 if (cchUsed + 2 < cbBuf)
799 {
800 memmove(pszBuf + 2, pszBuf, cchUsed + 2);
801 cchUsed += 2;
802 }
803
804 pszBuf[0] = ';';
805 pszBuf[1] = ' ';
806 }
807
808 return cchUsed;
809}
810
811
812/**
813 * Disassembler callback for reading opcode bytes.
814 *
815 * @returns VINF_SUCCESS.
816 * @param uFlatAddr The address to read at.
817 * @param pbDst Where to store them.
818 * @param cbToRead How many to read.
819 * @param pvUser Unused.
820 */
821static DECLCALLBACK(int) disReadOpcodeBytes(RTUINTPTR uFlatAddr, uint8_t *pbDst, unsigned cbToRead, void *pvUser)
822{
823 if (uFlatAddr + cbToRead >= VBOX_BIOS_BASE + _64K)
824 {
825 RT_BZERO(pbDst, cbToRead);
826 if (uFlatAddr >= VBOX_BIOS_BASE + _64K)
827 cbToRead = 0;
828 else
829 cbToRead = VBOX_BIOS_BASE + _64K - uFlatAddr;
830 }
831 memcpy(pbDst, &g_pbImg[uFlatAddr - VBOX_BIOS_BASE], cbToRead);
832 NOREF(pvUser);
833 return VINF_SUCCESS;
834}
835
836
837/**
838 * Disassembles code.
839 *
840 * @returns @c true on success, @c false on failure.
841 * @param uFlatAddr The address where the code starts.
842 * @param cb The amount of code to disassemble.
843 * @param fIs16Bit Is is 16-bit (@c true) or 32-bit (@c false).
844 */
845static bool disCode(uint32_t uFlatAddr, uint32_t cb, bool fIs16Bit)
846{
847 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
848
849 while (cb > 0)
850 {
851 /* Trailing zero padding detection. */
852 if ( *pb == '\0'
853 && ASMMemIsAll8(pb, RT_MIN(cb, 8), 0) == NULL)
854 {
855 void *pv = ASMMemIsAll8(pb, cb, 0);
856 uint32_t cbZeros = pv ? (uint32_t)((uint8_t const *)pv - pb) : cb;
857 if (!outputPrintf(" times %#x db 0\n", cbZeros))
858 return false;
859 cb -= cbZeros;
860 pb += cbZeros;
861 uFlatAddr += cbZeros;
862 if ( cb == 2
863 && pb[0] == 'X'
864 && pb[1] == 'M')
865 return disStringData(uFlatAddr, cb);
866 }
867 /* Work arounds for switch tables and such (disas assertions). */
868 else if ( ( pb[0] == 0x11 /* int13_cdemu switch */
869 && pb[1] == 0xda
870 && pb[2] == 0x05
871 && pb[3] == 0xff
872 && pb[4] == 0xff
873 )
874 || 0
875 )
876 return disByteData(uFlatAddr, cb);
877 else
878 {
879 unsigned cbInstr;
880 DISCPUSTATE CpuState;
881 int rc = DISCoreOneEx(uFlatAddr, fIs16Bit ? CPUMODE_16BIT : CPUMODE_32BIT,
882 disReadOpcodeBytes, NULL, &CpuState, &cbInstr);
883 if ( RT_SUCCESS(rc)
884 && cbInstr <= cb)
885 {
886 char szTmp[4096];
887 size_t cch = DISFormatYasmEx(&CpuState, szTmp, sizeof(szTmp),
888 DIS_FMT_FLAGS_STRICT
889 | DIS_FMT_FLAGS_BYTES_RIGHT | DIS_FMT_FLAGS_BYTES_COMMENT | DIS_FMT_FLAGS_BYTES_SPACED,
890 NULL, NULL);
891 cch = disHandleYasmDifferences(&CpuState, uFlatAddr, cbInstr, szTmp, sizeof(szTmp), cch);
892 Assert(cch < sizeof(szTmp));
893
894 if (g_cVerbose > 1)
895 {
896 while (cch < 72)
897 szTmp[cch++] = ' ';
898 RTStrPrintf(&szTmp[cch], sizeof(szTmp) - cch, "; %#x", uFlatAddr);
899 }
900
901 if (!outputPrintf(" %s\n", szTmp))
902 return false;
903 cb -= cbInstr;
904 pb += cbInstr;
905 uFlatAddr += cbInstr;
906 }
907 else
908 {
909 if (!disByteData(uFlatAddr, 1))
910 return false;
911 cb--;
912 pb++;
913 uFlatAddr++;
914 }
915 }
916 }
917 return true;
918}
919
920
921static bool disCodeSegment(uint32_t iSeg)
922{
923 uint32_t uFlatAddr = g_aSegs[iSeg].uFlatAddr;
924 uint32_t cb = g_aSegs[iSeg].cb;
925
926 while (cb > 0)
927 {
928 uint32_t off;
929 RTDBGSYMBOL Sym;
930 disGetNextSymbol(uFlatAddr, cb, &off, &Sym);
931
932 if (off > 0)
933 {
934 if (!disByteData(uFlatAddr, off))
935 return false;
936 cb -= off;
937 uFlatAddr += off;
938 off = 0;
939 if (!cb)
940 break;
941 }
942
943 bool fRc;
944 if (off == 0)
945 {
946 size_t cchName = strlen(Sym.szName);
947 fRc = outputPrintf("%s: %*s; %#x LB %#x\n", Sym.szName, cchName < 41 - 2 ? cchName - 41 - 2 : 0, "", uFlatAddr, Sym.cb);
948 if (!fRc)
949 return false;
950
951 if (disIsCodeAndAdjustSize(uFlatAddr, &Sym, &g_aSegs[iSeg]))
952 fRc = disCode(uFlatAddr, Sym.cb, disIs16BitCode(Sym.szName));
953 else
954 fRc = disByteData(uFlatAddr, Sym.cb);
955
956 uFlatAddr += Sym.cb;
957 cb -= Sym.cb;
958 }
959 else
960 {
961 fRc = disByteData(uFlatAddr, cb);
962 uFlatAddr += cb;
963 cb = 0;
964 }
965 if (!fRc)
966 return false;
967 }
968
969 return true;
970}
971
972
973static RTEXITCODE DisassembleBiosImage(void)
974{
975 if (!outputPrintf(""))
976 return RTEXITCODE_FAILURE;
977
978 /*
979 * Work the image segment by segment.
980 */
981 bool fRc = true;
982 uint32_t uFlatAddr = VBOX_BIOS_BASE;
983 for (uint32_t iSeg = 0; iSeg < g_cSegs && fRc; iSeg++)
984 {
985 /* Is there a gap between the segments? */
986 if (uFlatAddr < g_aSegs[iSeg].uFlatAddr)
987 {
988 fRc = disCopySegmentGap(uFlatAddr, g_aSegs[iSeg].uFlatAddr - uFlatAddr);
989 if (!fRc)
990 break;
991 uFlatAddr = g_aSegs[iSeg].uFlatAddr;
992 }
993 else if (uFlatAddr > g_aSegs[iSeg].uFlatAddr)
994 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Overlapping segments: %u and %u; uFlatAddr=%#x\n", iSeg - 1, iSeg, uFlatAddr);
995
996 /* Disassemble the segment. */
997 fRc = outputPrintf("\n"
998 "section %s progbits vstart=%#x align=1 ; size=%#x class=%s group=%s\n",
999 g_aSegs[iSeg].szName, g_aSegs[iSeg].uFlatAddr - VBOX_BIOS_BASE,
1000 g_aSegs[iSeg].cb, g_aSegs[iSeg].szClass, g_aSegs[iSeg].szGroup);
1001 if (!fRc)
1002 return RTEXITCODE_FAILURE;
1003 if (!strcmp(g_aSegs[iSeg].szName, "CONST"))
1004 fRc = disConstSegment(iSeg);
1005 else if (!strcmp(g_aSegs[iSeg].szClass, "DATA"))
1006 fRc = disDataSegment(iSeg);
1007 else
1008 fRc = disCodeSegment(iSeg);
1009
1010 /* Advance. */
1011 uFlatAddr += g_aSegs[iSeg].cb;
1012 }
1013
1014 /* Final gap. */
1015 if (uFlatAddr < VBOX_BIOS_BASE + _64K)
1016 fRc = disCopySegmentGap(uFlatAddr, VBOX_BIOS_BASE + _64K - uFlatAddr);
1017 else if (uFlatAddr > VBOX_BIOS_BASE + _64K)
1018 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Last segment spills beyond 1MB; uFlatAddr=%#x\n", uFlatAddr);
1019
1020 if (!fRc)
1021 return RTEXITCODE_FAILURE;
1022 return RTEXITCODE_SUCCESS;
1023}
1024
1025
1026
1027/**
1028 * Parses the symbol file for the BIOS.
1029 *
1030 * This is in ELF/DWARF format.
1031 *
1032 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
1033 * @param pszBiosSym Path to the sym file.
1034 */
1035static RTEXITCODE ParseSymFile(const char *pszBiosSym)
1036{
1037 /** @todo use RTDbg* later. (Just checking for existance currently.) */
1038 PRTSTREAM hStrm;
1039 int rc = RTStrmOpen(pszBiosSym, "rb", &hStrm);
1040 if (RT_FAILURE(rc))
1041 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Error opening '%s': %Rrc", pszBiosSym, rc);
1042 RTStrmClose(hStrm);
1043 return RTEXITCODE_SUCCESS;
1044}
1045
1046
1047/**
1048 * Reads a line from the file.
1049 *
1050 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1051 * @param pMap The map file handle.
1052 */
1053static bool mapReadLine(PBIOSMAP pMap)
1054{
1055 int rc = RTStrmGetLine(pMap->hStrm, pMap->szLine, sizeof(pMap->szLine));
1056 if (RT_FAILURE(rc))
1057 {
1058 if (rc == VERR_EOF)
1059 {
1060 pMap->fEof = true;
1061 pMap->cch = 0;
1062 pMap->offNW = 0;
1063 pMap->szLine[0] = '\0';
1064 }
1065 else
1066 RTMsgError("%s:%d: Read error %Rrc", pMap->pszMapFile, pMap->iLine + 1, rc);
1067 return false;
1068 }
1069 pMap->iLine++;
1070 pMap->cch = (uint32_t)strlen(pMap->szLine);
1071
1072 /* Check out leading white space. */
1073 if (!RT_C_IS_SPACE(pMap->szLine[0]))
1074 pMap->offNW = 0;
1075 else
1076 {
1077 uint32_t off = 1;
1078 while (RT_C_IS_SPACE(pMap->szLine[off]))
1079 off++;
1080 pMap->offNW = off;
1081 }
1082
1083 return true;
1084}
1085
1086
1087/**
1088 * Checks if it is an empty line.
1089 * @returns @c true if empty, @c false if not.
1090 * @param pMap The map file handle.
1091 */
1092static bool mapIsEmptyLine(PBIOSMAP pMap)
1093{
1094 Assert(pMap->offNW <= pMap->cch);
1095 return pMap->offNW == pMap->cch;
1096}
1097
1098
1099/**
1100 * Reads ahead in the map file until a non-empty line or EOF is encountered.
1101 *
1102 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1103 * @param pMap The map file handle.
1104 */
1105static bool mapSkipEmptyLines(PBIOSMAP pMap)
1106{
1107 for (;;)
1108 {
1109 if (!mapReadLine(pMap))
1110 return false;
1111 if (pMap->offNW < pMap->cch)
1112 return true;
1113 }
1114}
1115
1116
1117/**
1118 * Reads ahead in the map file until an empty line or EOF is encountered.
1119 *
1120 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1121 * @param pMap The map file handle.
1122 */
1123static bool mapSkipNonEmptyLines(PBIOSMAP pMap)
1124{
1125 for (;;)
1126 {
1127 if (!mapReadLine(pMap))
1128 return false;
1129 if (pMap->offNW == pMap->cch)
1130 return true;
1131 }
1132}
1133
1134
1135/**
1136 * Strips the current line.
1137 *
1138 * The string length may change.
1139 *
1140 * @returns Pointer to the first non-space character.
1141 * @param pMap The map file handle.
1142 * @param pcch Where to return the length of the unstripped
1143 * part. Optional.
1144 */
1145static char *mapStripCurrentLine(PBIOSMAP pMap, size_t *pcch)
1146{
1147 char *psz = &pMap->szLine[pMap->offNW];
1148 char *pszEnd = &pMap->szLine[pMap->cch];
1149 while ( (uintptr_t)pszEnd > (uintptr_t)psz
1150 && RT_C_IS_SPACE(pszEnd[-1]))
1151 {
1152 *--pszEnd = '\0';
1153 pMap->cch--;
1154 }
1155 if (pcch)
1156 *pcch = pszEnd - psz;
1157 return psz;
1158}
1159
1160
1161/**
1162 * Reads a line from the file and right strips it.
1163 *
1164 * @returns Pointer to szLine on success, @c NULL + msg on failure, @c NULL on
1165 * EOF.
1166 * @param pMap The map file handle.
1167 * @param pcch Where to return the length of the unstripped
1168 * part. Optional.
1169 */
1170static char *mapReadLineStripRight(PBIOSMAP pMap, size_t *pcch)
1171{
1172 if (!mapReadLine(pMap))
1173 return NULL;
1174 mapStripCurrentLine(pMap, NULL);
1175 if (pcch)
1176 *pcch = pMap->cch;
1177 return pMap->szLine;
1178}
1179
1180
1181/**
1182 * mapReadLine() + mapStripCurrentLine().
1183 *
1184 * @returns Pointer to the first non-space character in the new line. NULL on
1185 * read error (bitched already) or end of file.
1186 * @param pMap The map file handle.
1187 * @param pcch Where to return the length of the unstripped
1188 * part. Optional.
1189 */
1190static char *mapReadLineStrip(PBIOSMAP pMap, size_t *pcch)
1191{
1192 if (!mapReadLine(pMap))
1193 return NULL;
1194 return mapStripCurrentLine(pMap, pcch);
1195}
1196
1197
1198/**
1199 * Parses a word, copying it into the supplied buffer, and skipping any spaces
1200 * following it.
1201 *
1202 * @returns @c true on success, @c false on failure.
1203 * @param ppszCursor Pointer to the cursor variable.
1204 * @param pszBuf The output buffer.
1205 * @param cbBuf The size of the output buffer.
1206 */
1207static bool mapParseWord(char **ppszCursor, char *pszBuf, size_t cbBuf)
1208{
1209 /* Check that we start on a non-blank. */
1210 char *pszStart = *ppszCursor;
1211 if (!*pszStart || RT_C_IS_SPACE(*pszStart))
1212 return false;
1213
1214 /* Find the end of the word. */
1215 char *psz = pszStart + 1;
1216 while (*psz && !RT_C_IS_SPACE(*psz))
1217 psz++;
1218
1219 /* Copy it. */
1220 size_t cchWord = (uintptr_t)psz - (uintptr_t)pszStart;
1221 if (cchWord >= cbBuf)
1222 return false;
1223 memcpy(pszBuf, pszStart, cchWord);
1224 pszBuf[cchWord] = '\0';
1225
1226 /* Skip blanks following it. */
1227 while (RT_C_IS_SPACE(*psz))
1228 psz++;
1229 *ppszCursor = psz;
1230 return true;
1231}
1232
1233
1234/**
1235 * Parses an 16:16 address.
1236 *
1237 * @returns @c true on success, @c false on failure.
1238 * @param ppszCursor Pointer to the cursor variable.
1239 * @param pAddr Where to return the address.
1240 */
1241static bool mapParseAddress(char **ppszCursor, PRTFAR16 pAddr)
1242{
1243 char szWord[32];
1244 if (!mapParseWord(ppszCursor, szWord, sizeof(szWord)))
1245 return false;
1246 size_t cchWord = strlen(szWord);
1247
1248 /* An address is at least 16:16 format. It may be 16:32. It may also be flagged. */
1249 size_t cchAddr = 4 + 1 + 4;
1250 if (cchWord < cchAddr)
1251 return false;
1252 if ( !RT_C_IS_XDIGIT(szWord[0])
1253 || !RT_C_IS_XDIGIT(szWord[1])
1254 || !RT_C_IS_XDIGIT(szWord[2])
1255 || !RT_C_IS_XDIGIT(szWord[3])
1256 || szWord[4] != ':'
1257 || !RT_C_IS_XDIGIT(szWord[5])
1258 || !RT_C_IS_XDIGIT(szWord[6])
1259 || !RT_C_IS_XDIGIT(szWord[7])
1260 || !RT_C_IS_XDIGIT(szWord[8])
1261 )
1262 return false;
1263 if ( cchWord > cchAddr
1264 && RT_C_IS_XDIGIT(szWord[9])
1265 && RT_C_IS_XDIGIT(szWord[10])
1266 && RT_C_IS_XDIGIT(szWord[11])
1267 && RT_C_IS_XDIGIT(szWord[12]))
1268 cchAddr += 4;
1269
1270 /* Drop flag if present. */
1271 if (cchWord > cchAddr)
1272 {
1273 if (RT_C_IS_XDIGIT(szWord[4+1+4]))
1274 return false;
1275 szWord[cchAddr] = '\0';
1276 cchWord = cchAddr;
1277 }
1278
1279 /* Convert it. */
1280 szWord[4] = '\0';
1281 int rc1 = RTStrToUInt16Full(szWord, 16, &pAddr->sel);
1282 if (rc1 != VINF_SUCCESS)
1283 return false;
1284
1285 int rc2 = RTStrToUInt16Full(szWord + 5, 16, &pAddr->off);
1286 if (rc2 != VINF_SUCCESS)
1287 return false;
1288 return true;
1289}
1290
1291
1292/**
1293 * Parses a size.
1294 *
1295 * @returns @c true on success, @c false on failure.
1296 * @param ppszCursor Pointer to the cursor variable.
1297 * @param pcb Where to return the size.
1298 */
1299static bool mapParseSize(char **ppszCursor, uint32_t *pcb)
1300{
1301 char szWord[32];
1302 if (!mapParseWord(ppszCursor, szWord, sizeof(szWord)))
1303 return false;
1304 size_t cchWord = strlen(szWord);
1305 if (cchWord != 8)
1306 return false;
1307
1308 int rc = RTStrToUInt32Full(szWord, 16, pcb);
1309 if (rc != VINF_SUCCESS)
1310 return false;
1311 return true;
1312}
1313
1314
1315/**
1316 * Parses a section box and the following column header.
1317 *
1318 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1319 * @param pMap Map file handle.
1320 * @param pszSectionNm The expected section name.
1321 * @param cColumns The number of columns.
1322 * @param ... The column names.
1323 */
1324static bool mapSkipThruColumnHeadings(PBIOSMAP pMap, const char *pszSectionNm, uint32_t cColumns, ...)
1325{
1326 if ( mapIsEmptyLine(pMap)
1327 && !mapSkipEmptyLines(pMap))
1328 return false;
1329
1330 /* +------------+ */
1331 size_t cch;
1332 char *psz = mapStripCurrentLine(pMap, &cch);
1333 if (!psz)
1334 return false;
1335
1336 if ( psz[0] != '+'
1337 || psz[1] != '-'
1338 || psz[2] != '-'
1339 || psz[3] != '-'
1340 || psz[cch - 4] != '-'
1341 || psz[cch - 3] != '-'
1342 || psz[cch - 2] != '-'
1343 || psz[cch - 1] != '+'
1344 )
1345 {
1346 RTMsgError("%s:%d: Expected section box: +-----...", pMap->pszMapFile, pMap->iLine);
1347 return false;
1348 }
1349
1350 /* | pszSectionNm | */
1351 psz = mapReadLineStrip(pMap, &cch);
1352 if (!psz)
1353 return false;
1354
1355 size_t cchSectionNm = strlen(pszSectionNm);
1356 if ( psz[0] != '|'
1357 || psz[1] != ' '
1358 || psz[2] != ' '
1359 || psz[3] != ' '
1360 || psz[cch - 4] != ' '
1361 || psz[cch - 3] != ' '
1362 || psz[cch - 2] != ' '
1363 || psz[cch - 1] != '|'
1364 || cch != 1 + 3 + cchSectionNm + 3 + 1
1365 || strncmp(&psz[4], pszSectionNm, cchSectionNm)
1366 )
1367 {
1368 RTMsgError("%s:%d: Expected section box: | %s |", pMap->pszMapFile, pMap->iLine, pszSectionNm);
1369 return false;
1370 }
1371
1372 /* +------------+ */
1373 psz = mapReadLineStrip(pMap, &cch);
1374 if (!psz)
1375 return false;
1376 if ( psz[0] != '+'
1377 || psz[1] != '-'
1378 || psz[2] != '-'
1379 || psz[3] != '-'
1380 || psz[cch - 4] != '-'
1381 || psz[cch - 3] != '-'
1382 || psz[cch - 2] != '-'
1383 || psz[cch - 1] != '+'
1384 )
1385 {
1386 RTMsgError("%s:%d: Expected section box: +-----...", pMap->pszMapFile, pMap->iLine);
1387 return false;
1388 }
1389
1390 /* There may be a few lines describing the table notation now, surrounded by blank lines. */
1391 do
1392 {
1393 psz = mapReadLineStripRight(pMap, &cch);
1394 if (!psz)
1395 return false;
1396 } while ( *psz == '\0'
1397 || ( !RT_C_IS_SPACE(psz[0])
1398 && RT_C_IS_SPACE(psz[1])
1399 && psz[2] == '='
1400 && RT_C_IS_SPACE(psz[3]))
1401 );
1402
1403 /* Should have the column heading now. */
1404 va_list va;
1405 va_start(va, cColumns);
1406 for (uint32_t i = 0; i < cColumns; i++)
1407 {
1408 const char *pszColumn = va_arg(va, const char *);
1409 size_t cchColumn = strlen(pszColumn);
1410 if ( strncmp(psz, pszColumn, cchColumn)
1411 || ( psz[cchColumn] != '\0'
1412 && !RT_C_IS_SPACE(psz[cchColumn])))
1413 {
1414 va_end(va);
1415 RTMsgError("%s:%d: Expected column '%s' found '%s'", pMap->pszMapFile, pMap->iLine, pszColumn, psz);
1416 return false;
1417 }
1418 psz += cchColumn;
1419 while (RT_C_IS_SPACE(*psz))
1420 psz++;
1421 }
1422 va_end(va);
1423
1424 /* The next line is the underlining. */
1425 psz = mapReadLineStripRight(pMap, &cch);
1426 if (!psz)
1427 return false;
1428 if (*psz != '=' || psz[cch - 1] != '=')
1429 {
1430 RTMsgError("%s:%d: Expected column header underlining", pMap->pszMapFile, pMap->iLine);
1431 return false;
1432 }
1433
1434 /* Skip one blank line. */
1435 psz = mapReadLineStripRight(pMap, &cch);
1436 if (!psz)
1437 return false;
1438 if (*psz)
1439 {
1440 RTMsgError("%s:%d: Expected blank line beneath the column headers", pMap->pszMapFile, pMap->iLine);
1441 return false;
1442 }
1443
1444 return true;
1445}
1446
1447
1448/**
1449 * Parses a segment list.
1450 *
1451 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1452 * @param pMap The map file handle.
1453 */
1454static bool mapParseSegments(PBIOSMAP pMap)
1455{
1456 for (;;)
1457 {
1458 if (!mapReadLineStripRight(pMap, NULL))
1459 return false;
1460
1461 /* The end? The line should be empty. Expectes segment name to not
1462 start with a space. */
1463 if (!pMap->szLine[0] || RT_C_IS_SPACE(pMap->szLine[0]))
1464 {
1465 if (!pMap->szLine[0])
1466 return true;
1467 RTMsgError("%s:%u: Malformed segment line", pMap->pszMapFile, pMap->iLine);
1468 return false;
1469 }
1470
1471 /* Parse the segment line. */
1472 uint32_t iSeg = g_cSegs;
1473 if (iSeg >= RT_ELEMENTS(g_aSegs))
1474 {
1475 RTMsgError("%s:%u: Too many segments", pMap->pszMapFile, pMap->iLine);
1476 return false;
1477 }
1478
1479 char *psz = pMap->szLine;
1480 if (!mapParseWord(&psz, g_aSegs[iSeg].szName, sizeof(g_aSegs[iSeg].szName)))
1481 RTMsgError("%s:%u: Segment name parser error", pMap->pszMapFile, pMap->iLine);
1482 else if (!mapParseWord(&psz, g_aSegs[iSeg].szClass, sizeof(g_aSegs[iSeg].szClass)))
1483 RTMsgError("%s:%u: Segment class parser error", pMap->pszMapFile, pMap->iLine);
1484 else if (!mapParseWord(&psz, g_aSegs[iSeg].szGroup, sizeof(g_aSegs[iSeg].szGroup)))
1485 RTMsgError("%s:%u: Segment group parser error", pMap->pszMapFile, pMap->iLine);
1486 else if (!mapParseAddress(&psz, &g_aSegs[iSeg].Address))
1487 RTMsgError("%s:%u: Segment address parser error", pMap->pszMapFile, pMap->iLine);
1488 else if (!mapParseSize(&psz, &g_aSegs[iSeg].cb))
1489 RTMsgError("%s:%u: Segment size parser error", pMap->pszMapFile, pMap->iLine);
1490 else
1491 {
1492 g_aSegs[iSeg].uFlatAddr = ((uint32_t)g_aSegs[iSeg].Address.sel << 4) + g_aSegs[iSeg].Address.off;
1493 g_cSegs++;
1494 if (g_cVerbose > 2)
1495 RTStrmPrintf(g_pStdErr, "read segment at %08x / %04x:%04x LB %04x %s / %s / %s\n",
1496 g_aSegs[iSeg].uFlatAddr,
1497 g_aSegs[iSeg].Address.sel,
1498 g_aSegs[iSeg].Address.off,
1499 g_aSegs[iSeg].cb,
1500 g_aSegs[iSeg].szName,
1501 g_aSegs[iSeg].szClass,
1502 g_aSegs[iSeg].szGroup);
1503
1504 while (RT_C_IS_SPACE(*psz))
1505 psz++;
1506 if (!*psz)
1507 continue;
1508 RTMsgError("%s:%u: Junk at end of line", pMap->pszMapFile, pMap->iLine);
1509 }
1510 return false;
1511 }
1512}
1513
1514
1515/**
1516 * Sorts the segment array by flat address and adds them to the debug module.
1517 *
1518 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1519 */
1520static bool mapSortAndAddSegments(void)
1521{
1522 for (uint32_t i = 0; i < g_cSegs; i++)
1523 {
1524 for (uint32_t j = i + 1; j < g_cSegs; j++)
1525 if (g_aSegs[j].uFlatAddr < g_aSegs[i].uFlatAddr)
1526 {
1527 BIOSSEG Tmp = g_aSegs[i];
1528 g_aSegs[i] = g_aSegs[j];
1529 g_aSegs[j] = Tmp;
1530 }
1531 if (g_cVerbose > 0)
1532 RTStrmPrintf(g_pStdErr, "segment at %08x / %04x:%04x LB %04x %s / %s / %s\n",
1533 g_aSegs[i].uFlatAddr,
1534 g_aSegs[i].Address.sel,
1535 g_aSegs[i].Address.off,
1536 g_aSegs[i].cb,
1537 g_aSegs[i].szName,
1538 g_aSegs[i].szClass,
1539 g_aSegs[i].szGroup);
1540
1541 RTDBGSEGIDX idx = i;
1542 int rc = RTDbgModSegmentAdd(g_hMapMod, g_aSegs[i].uFlatAddr, g_aSegs[i].cb, g_aSegs[i].szName, 0 /*fFlags*/, &idx);
1543 if (RT_FAILURE(rc))
1544 {
1545 RTMsgError("RTDbgModSegmentAdd failed on %s: %Rrc", g_aSegs[i].szName);
1546 return false;
1547 }
1548 }
1549 return true;
1550}
1551
1552
1553/**
1554 * Parses a segment list.
1555 *
1556 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1557 * @param pMap The map file handle.
1558 */
1559static bool mapParseSymbols(PBIOSMAP pMap)
1560{
1561 for (;;)
1562 {
1563 if (!mapReadLineStripRight(pMap, NULL))
1564 return false;
1565
1566 /* The end? The line should be empty. Expectes segment name to not
1567 start with a space. */
1568 if (!pMap->szLine[0] || RT_C_IS_SPACE(pMap->szLine[0]))
1569 {
1570 if (!pMap->szLine[0])
1571 return true;
1572 RTMsgError("%s:%u: Malformed symbol line", pMap->pszMapFile, pMap->iLine);
1573 return false;
1574 }
1575
1576 /* Skip the module name lines for now. */
1577 if (!strncmp(pMap->szLine, RT_STR_TUPLE("Module: ")))
1578 continue;
1579
1580 /* Parse the segment line. */
1581 char szName[4096];
1582 RTFAR16 Addr;
1583 char *psz = pMap->szLine;
1584 if (!mapParseAddress(&psz, &Addr))
1585 RTMsgError("%s:%u: Symbol address parser error", pMap->pszMapFile, pMap->iLine);
1586 else if (!mapParseWord(&psz, szName, sizeof(szName)))
1587 RTMsgError("%s:%u: Symbol name parser error", pMap->pszMapFile, pMap->iLine);
1588 else
1589 {
1590 uint32_t uFlatAddr = ((uint32_t)Addr.sel << 4) + Addr.off;
1591 if (uFlatAddr == 0)
1592 continue;
1593
1594 int rc = RTDbgModSymbolAdd(g_hMapMod, szName, RTDBGSEGIDX_RVA, uFlatAddr, 0 /*cb*/, 0 /*fFlags*/, NULL);
1595 if (RT_SUCCESS(rc) || rc == VERR_DBG_ADDRESS_CONFLICT)
1596 {
1597
1598 if (g_cVerbose > 2)
1599 RTStrmPrintf(g_pStdErr, "read symbol - %08x %s\n", uFlatAddr, szName);
1600 while (RT_C_IS_SPACE(*psz))
1601 psz++;
1602 if (!*psz)
1603 continue;
1604 RTMsgError("%s:%u: Junk at end of line", pMap->pszMapFile, pMap->iLine);
1605 }
1606 else
1607 RTMsgError("%s:%u: RTDbgModSymbolAdd failed: %Rrc", pMap->pszMapFile, pMap->iLine, rc);
1608 }
1609 return false;
1610 }
1611}
1612
1613
1614/**
1615 * Parses the given map file.
1616 *
1617 * @returns RTEXITCODE_SUCCESS and lots of globals, or RTEXITCODE_FAILURE and a
1618 * error message.
1619 * @param pMap The map file handle.
1620 */
1621static RTEXITCODE mapParseFile(PBIOSMAP pMap)
1622{
1623 int rc = RTDbgModCreate(&g_hMapMod, "VBoxBios", 0 /*cbSeg*/, 0 /*fFlags*/);
1624 if (RT_FAILURE(rc))
1625 return RTMsgErrorExit(RTEXITCODE_FAILURE, "RTDbgModCreate failed: %Rrc", rc);
1626
1627 /*
1628 * Read the header.
1629 */
1630 if (!mapReadLine(pMap))
1631 return RTEXITCODE_FAILURE;
1632 if (strncmp(pMap->szLine, RT_STR_TUPLE("Open Watcom Linker Version")))
1633 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Unexpected map-file header: '%s'", pMap->szLine);
1634 if ( !mapSkipNonEmptyLines(pMap)
1635 || !mapSkipEmptyLines(pMap))
1636 return RTEXITCODE_FAILURE;
1637
1638 /*
1639 * Skip groups.
1640 */
1641 if (!mapSkipThruColumnHeadings(pMap, "Groups", 3, "Group", "Address", "Size", NULL))
1642 return RTEXITCODE_FAILURE;
1643 if (!mapSkipNonEmptyLines(pMap))
1644 return RTEXITCODE_FAILURE;
1645
1646 /*
1647 * Parse segments.
1648 */
1649 if (!mapSkipThruColumnHeadings(pMap, "Segments", 5, "Segment", "Class", "Group", "Address", "Size"))
1650 return RTEXITCODE_FAILURE;
1651 if (!mapParseSegments(pMap))
1652 return RTEXITCODE_FAILURE;
1653 if (!mapSortAndAddSegments())
1654 return RTEXITCODE_FAILURE;
1655
1656 /*
1657 * Parse symbols.
1658 */
1659 if (!mapSkipThruColumnHeadings(pMap, "Memory Map", 2, "Address", "Symbol"))
1660 return RTEXITCODE_FAILURE;
1661 if (!mapParseSymbols(pMap))
1662 return RTEXITCODE_FAILURE;
1663
1664 /* Ignore the rest of the file. */
1665 return RTEXITCODE_SUCCESS;
1666}
1667
1668
1669/**
1670 * Parses the linker map file for the BIOS.
1671 *
1672 * This is generated by the Watcom linker.
1673 *
1674 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
1675 * @param pszBiosMap Path to the map file.
1676 */
1677static RTEXITCODE ParseMapFile(const char *pszBiosMap)
1678{
1679 BIOSMAP Map;
1680 Map.pszMapFile = pszBiosMap;
1681 Map.hStrm = NULL;
1682 Map.iLine = 0;
1683 Map.fEof = false;
1684 Map.cch = 0;
1685 Map.offNW = 0;
1686 int rc = RTStrmOpen(pszBiosMap, "r", &Map.hStrm);
1687 if (RT_FAILURE(rc))
1688 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Error opening '%s': %Rrc", pszBiosMap, rc);
1689 RTEXITCODE rcExit = mapParseFile(&Map);
1690 RTStrmClose(Map.hStrm);
1691 return rcExit;
1692}
1693
1694
1695/**
1696 * Reads the BIOS image into memory (g_pbImg and g_cbImg).
1697 *
1698 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
1699 * @param pszBiosImg Path to the image file.
1700 */
1701static RTEXITCODE ReadBiosImage(const char *pszBiosImg)
1702{
1703 void *pvImg;
1704 size_t cbImg;
1705 int rc = RTFileReadAll(pszBiosImg, &pvImg, &cbImg);
1706 if (RT_FAILURE(rc))
1707 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Error reading '%s': %Rrc", pszBiosImg, rc);
1708 if (cbImg != _64K)
1709 {
1710 RTFileReadAllFree(pvImg, cbImg);
1711 return RTMsgErrorExit(RTEXITCODE_FAILURE, "The BIOS image %u bytes intead of 64KB", cbImg);
1712 }
1713
1714 g_pbImg = (uint8_t *)pvImg;
1715 g_cbImg = cbImg;
1716 return RTEXITCODE_SUCCESS;
1717}
1718
1719
1720int main(int argc, char **argv)
1721{
1722 int rc = RTR3InitExe(argc, &argv, 0);
1723 if (RT_FAILURE(rc))
1724 return RTMsgInitFailure(rc);
1725
1726 /*
1727 * Option config.
1728 */
1729 static RTGETOPTDEF const s_aOpts[] =
1730 {
1731 { "--bios-image", 'i', RTGETOPT_REQ_STRING },
1732 { "--bios-map", 'm', RTGETOPT_REQ_STRING },
1733 { "--bios-sym", 's', RTGETOPT_REQ_STRING },
1734 { "--output", 'o', RTGETOPT_REQ_STRING },
1735 { "--verbose", 'v', RTGETOPT_REQ_NOTHING },
1736 { "--quiet", 'q', RTGETOPT_REQ_NOTHING },
1737 };
1738
1739 const char *pszBiosMap = NULL;
1740 const char *pszBiosSym = NULL;
1741 const char *pszBiosImg = NULL;
1742 const char *pszOutput = NULL;
1743
1744 RTGETOPTUNION ValueUnion;
1745 RTGETOPTSTATE GetOptState;
1746 rc = RTGetOptInit(&GetOptState, argc, argv, &s_aOpts[0], RT_ELEMENTS(s_aOpts), 1, RTGETOPTINIT_FLAGS_OPTS_FIRST);
1747 AssertReleaseRCReturn(rc, RTEXITCODE_FAILURE);
1748
1749 /*
1750 * Process the options.
1751 */
1752 while ((rc = RTGetOpt(&GetOptState, &ValueUnion)) != 0)
1753 {
1754 switch (rc)
1755 {
1756 case 'i':
1757 if (pszBiosImg)
1758 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-image is given more than once");
1759 pszBiosImg = ValueUnion.psz;
1760 break;
1761
1762 case 'm':
1763 if (pszBiosMap)
1764 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-map is given more than once");
1765 pszBiosMap = ValueUnion.psz;
1766 break;
1767
1768 case 's':
1769 if (pszBiosSym)
1770 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-sym is given more than once");
1771 pszBiosSym = ValueUnion.psz;
1772 break;
1773
1774 case 'o':
1775 if (pszOutput)
1776 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--output is given more than once");
1777 pszOutput = ValueUnion.psz;
1778 break;
1779
1780 case 'v':
1781 g_cVerbose++;
1782 break;
1783
1784 case 'q':
1785 g_cVerbose = 0;
1786 break;
1787
1788 case 'H':
1789 RTPrintf("usage: %Rbn --bios-image <file.img> --bios-map <file.map> [--output <file.asm>]\n",
1790 argv[0]);
1791 return RTEXITCODE_SUCCESS;
1792
1793 case 'V':
1794 {
1795 /* The following is assuming that svn does it's job here. */
1796 RTPrintf("r%u\n", RTBldCfgRevision());
1797 return RTEXITCODE_SUCCESS;
1798 }
1799
1800 default:
1801 return RTGetOptPrintError(rc, &ValueUnion);
1802 }
1803 }
1804
1805 /*
1806 * Got it all?
1807 */
1808 if (!pszBiosImg)
1809 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-image is required");
1810 if (!pszBiosMap)
1811 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-map is required");
1812 if (!pszBiosSym)
1813 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-sym is required");
1814
1815 /*
1816 * Do the job.
1817 */
1818 RTEXITCODE rcExit;
1819 rcExit = ReadBiosImage(pszBiosImg);
1820 if (rcExit == RTEXITCODE_SUCCESS)
1821 rcExit = ParseMapFile(pszBiosMap);
1822 if (rcExit == RTEXITCODE_SUCCESS)
1823 rcExit = ParseSymFile(pszBiosSym);
1824 if (rcExit == RTEXITCODE_SUCCESS)
1825 rcExit = OpenOutputFile(pszOutput);
1826 if (rcExit == RTEXITCODE_SUCCESS)
1827 rcExit = DisassembleBiosImage();
1828
1829 return rcExit;
1830}
1831
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette