VirtualBox

source: vbox/trunk/src/VBox/Devices/PC/BIOS-new/MakeDebianBiosAssembly.cpp@ 41668

Last change on this file since 41668 was 41668, checked in by vboxsync, 13 years ago

DIS,DIS-users: Drop the operand/parameter formatting during instruction parsing. The desired formatter can do this afterwards if desired. Should save time + size. (DISCPUSTATE is now 256 bytes here on 64-bit linux, was ~406 yesterday.)

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 57.0 KB
Line 
1/* $Id: MakeDebianBiosAssembly.cpp 41668 2012-06-12 13:15:51Z vboxsync $ */
2/** @file
3 * MakeDebianBiosAssembly - Generate Assembly Source for Debian-minded Distros.
4 */
5
6/*
7 * Copyright (C) 2012 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*******************************************************************************
20* Header Files *
21*******************************************************************************/
22#include <iprt/asm.h>
23#include <iprt/buildconfig.h>
24#include <iprt/ctype.h>
25#include <iprt/dbg.h>
26#include <iprt/file.h>
27#include <iprt/getopt.h>
28#include <iprt/initterm.h>
29#include <iprt/list.h>
30#include <iprt/mem.h>
31#include <iprt/message.h>
32#include <iprt/string.h>
33#include <iprt/stream.h>
34#include <iprt/x86.h>
35
36#include <VBox/dis.h>
37
38
39/*******************************************************************************
40* Defined Constants And Macros *
41*******************************************************************************/
42/** The flat ROM base address. */
43#define VBOX_BIOS_BASE UINT32_C(0xf0000)
44
45
46/*******************************************************************************
47* Structures and Typedefs *
48*******************************************************************************/
49/**
50 * A BIOS segment.
51 */
52typedef struct BIOSSEG
53{
54 char szName[32];
55 char szClass[32];
56 char szGroup[32];
57 RTFAR16 Address;
58 uint32_t uFlatAddr;
59 uint32_t cb;
60} BIOSSEG;
61/** Pointer to a BIOS segment. */
62typedef BIOSSEG *PBIOSSEG;
63
64
65/**
66 * A BIOS object file.
67 */
68typedef struct BIOSOBJFILE
69{
70 RTLISTNODE Node;
71 char *pszSource;
72 char *pszObject;
73} BIOSOBJFILE;
74/** A BIOS object file. */
75typedef BIOSOBJFILE *PBIOSOBJFILE;
76
77
78/**
79 * Pointer to a BIOS map parser handle.
80 */
81typedef struct BIOSMAP
82{
83 /** The stream pointer. */
84 PRTSTREAM hStrm;
85 /** The file name. */
86 const char *pszMapFile;
87 /** Set when EOF has been reached. */
88 bool fEof;
89 /** The current line number (0 based).*/
90 uint32_t iLine;
91 /** The length of the current line. */
92 uint32_t cch;
93 /** The offset of the first non-white character on the line. */
94 uint32_t offNW;
95 /** The line buffer. */
96 char szLine[16384];
97} BIOSMAP;
98/** Pointer to a BIOS map parser handle. */
99typedef BIOSMAP *PBIOSMAP;
100
101
102/*******************************************************************************
103* Global Variables *
104*******************************************************************************/
105static unsigned g_cVerbose = 1 /*0*/;
106/** Pointer to the BIOS image. */
107static uint8_t const *g_pbImg;
108/** The size of the BIOS image. */
109static size_t g_cbImg;
110
111/** Debug module for the map file. */
112static RTDBGMOD g_hMapMod = NIL_RTDBGMOD;
113/** The number of BIOS segments found in the map file. */
114static uint32_t g_cSegs = 0;
115/** Array of BIOS segments from the map file. */
116static BIOSSEG g_aSegs[32];
117/** List of BIOSOBJFILE. */
118static RTLISTANCHOR g_ObjList;
119
120/** The output stream. */
121static PRTSTREAM g_hStrmOutput = NULL;
122
123
124static bool outputPrintfV(const char *pszFormat, va_list va)
125{
126 int rc = RTStrmPrintfV(g_hStrmOutput, pszFormat, va);
127 if (RT_FAILURE(rc))
128 {
129 RTMsgError("Output error: %Rrc\n", rc);
130 return false;
131 }
132 return true;
133}
134
135
136static bool outputPrintf(const char *pszFormat, ...)
137{
138 va_list va;
139 va_start(va, pszFormat);
140 bool fRc = outputPrintfV(pszFormat, va);
141 va_end(va);
142 return fRc;
143}
144
145
146/**
147 * Opens the output file for writing.
148 *
149 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
150 * @param pszOutput Path to the output file.
151 */
152static RTEXITCODE OpenOutputFile(const char *pszOutput)
153{
154 if (!pszOutput)
155 g_hStrmOutput = g_pStdOut;
156 else
157 {
158 int rc = RTStrmOpen(pszOutput, "w", &g_hStrmOutput);
159 if (RT_FAILURE(rc))
160 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Failed to open output file '%s': %Rrc", pszOutput, rc);
161 }
162 return RTEXITCODE_SUCCESS;
163}
164
165
166/**
167 * Displays a disassembly error and returns @c false.
168 *
169 * @returns @c false.
170 * @param pszFormat The error format string.
171 * @param ... Format argument.
172 */
173static bool disError(const char *pszFormat, ...)
174{
175 va_list va;
176 va_start(va, pszFormat);
177 RTMsgErrorV(pszFormat, va);
178 va_end(va);
179 return false;
180}
181
182
183/**
184 * Output the disassembly file header.
185 *
186 * @returns @c true on success,
187 */
188static bool disFileHeader(void)
189{
190 bool fRc;
191 fRc = outputPrintf("; $Id: MakeDebianBiosAssembly.cpp 41668 2012-06-12 13:15:51Z vboxsync $ \n"
192 ";; @file\n"
193 "; Auto Generated source file. Do not edit.\n"
194 ";\n"
195 );
196 if (!fRc)
197 return fRc;
198
199 /*
200 * List the header of each source file, up to and including the
201 * copyright notice.
202 */
203 PBIOSOBJFILE pObjFile;
204 RTListForEach(&g_ObjList, pObjFile, BIOSOBJFILE, Node)
205 {
206 PRTSTREAM hStrm;
207 int rc = RTStrmOpen(pObjFile->pszSource, "r", &hStrm);
208 if (RT_SUCCESS(rc))
209 {
210 fRc = outputPrintf("\n"
211 ";\n"
212 "; Source file: %Rbn\n"
213 ";\n"
214 , pObjFile->pszSource);
215 uint32_t iLine = 0;
216 bool fSeenCopyright = false;
217 char szLine[4096];
218 while ((rc = RTStrmGetLine(hStrm, szLine, sizeof(szLine))) == VINF_SUCCESS)
219 {
220 iLine++;
221
222 /* Check if we're done. */
223 char *psz = RTStrStrip(szLine);
224 if ( fSeenCopyright
225 && ( (psz[0] == '*' && psz[1] == '/')
226 || psz[0] == '\0') )
227 break;
228
229 /* Strip comment suffix. */
230 size_t cch = strlen(psz);
231 if (cch >= 2 && psz[cch - 1] == '/' && psz[cch - 2] == '*')
232 {
233 psz[cch - 2] = '\0';
234 RTStrStripR(psz);
235 }
236
237 /* Skip line prefix. */
238 if (psz[0] == '/' && psz[1] == '*')
239 psz += 2;
240 else if (psz[0] == '*')
241 psz += 1;
242 else
243 while (*psz == ';')
244 psz++;
245 if (RT_C_IS_SPACE(*psz))
246 psz++;
247
248 /* Skip the doxygen file tag line. */
249 if (!strcmp(psz, "* @file") || !strcmp(psz, "@file"))
250 continue;
251
252 /* Detect copyright section. */
253 if ( !fSeenCopyright
254 && ( strstr(psz, "Copyright")
255 || strstr(psz, "copyright")) )
256 fSeenCopyright = true;
257
258 fRc = outputPrintf("; %s\n", psz) && fRc;
259 }
260
261 RTStrmClose(hStrm);
262 if (rc != VINF_SUCCESS)
263 return disError("Error reading '%s': rc=%Rrc iLine=%u", pObjFile->pszSource, rc, iLine);
264 }
265 }
266
267 /*
268 * Set the org.
269 */
270 fRc = outputPrintf("\n"
271 "\n"
272 "\n"
273 ) && fRc;
274 return fRc;
275}
276
277
278/**
279 * Checks if a byte sequence could be a string litteral.
280 *
281 * @returns @c true if it is, @c false if it isn't.
282 * @param uFlatAddr The address of the byte sequence.
283 * @param cb The length of the sequence.
284 */
285static bool disIsString(uint32_t uFlatAddr, uint32_t cb)
286{
287 if (cb < 6)
288 return false;
289
290 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
291 while (cb > 0)
292 {
293 if ( !RT_C_IS_PRINT(*pb)
294 && *pb != '\r'
295 && *pb != '\n'
296 && *pb != '\t')
297 {
298 if (*pb == '\0')
299 {
300 do
301 {
302 pb++;
303 cb--;
304 } while (cb > 0 && *pb == '\0');
305 return cb == 0;
306 }
307 return false;
308 }
309 pb++;
310 cb--;
311 }
312
313 return true;
314}
315
316
317/**
318 * Checks if a dword could be a far 16:16 BIOS address.
319 *
320 * @returns @c true if it is, @c false if it isn't.
321 * @param uFlatAddr The address of the dword.
322 */
323static bool disIsFarBiosAddr(uint32_t uFlatAddr)
324{
325 uint16_t const *pu16 = (uint16_t const *)&g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
326 if (pu16[1] < 0xf000)
327 return false;
328 if (pu16[1] > 0xfff0)
329 return false;
330 uint32_t uFlatAddr2 = (uint32_t)(pu16[1] << 4) | pu16[0];
331 if (uFlatAddr2 >= VBOX_BIOS_BASE + _64K)
332 return false;
333 return true;
334}
335
336
337static bool disByteData(uint32_t uFlatAddr, uint32_t cb)
338{
339 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
340 size_t cbOnLine = 0;
341 while (cb-- > 0)
342 {
343 bool fRc;
344 if (cbOnLine >= 16)
345 {
346 fRc = outputPrintf("\n"
347 " db 0%02xh", *pb);
348 cbOnLine = 1;
349 }
350 else if (!cbOnLine)
351 {
352 fRc = outputPrintf(" db 0%02xh", *pb);
353 cbOnLine = 1;
354 }
355 else
356 {
357 fRc = outputPrintf(", 0%02xh", *pb);
358 cbOnLine++;
359 }
360 if (!fRc)
361 return false;
362 pb++;
363 }
364 return outputPrintf("\n");
365}
366
367
368static bool disWordData(uint32_t uFlatAddr, uint32_t cb)
369{
370 if (cb & 1)
371 return disError("disWordData expects word aligned size: cb=%#x uFlatAddr=%#x", uFlatAddr, cb);
372
373 uint16_t const *pu16 = (uint16_t const *)&g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
374 size_t cbOnLine = 0;
375 while (cb > 0)
376 {
377 bool fRc;
378 if (cbOnLine >= 16)
379 {
380 fRc = outputPrintf("\n"
381 " dw 0%04xh", *pu16);
382 cbOnLine = 2;
383 }
384 else if (!cbOnLine)
385 {
386 fRc = outputPrintf(" dw 0%04xh", *pu16);
387 cbOnLine = 2;
388 }
389 else
390 {
391 fRc = outputPrintf(", 0%04xh", *pu16);
392 cbOnLine += 2;
393 }
394 if (!fRc)
395 return false;
396 pu16++;
397 cb -= 2;
398 }
399 return outputPrintf("\n");
400}
401
402
403static bool disDWordData(uint32_t uFlatAddr, uint32_t cb)
404{
405 if (cb & 3)
406 return disError("disWordData expects dword aligned size: cb=%#x uFlatAddr=%#x", uFlatAddr, cb);
407
408 uint32_t const *pu32 = (uint32_t const *)&g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
409 size_t cbOnLine = 0;
410 while (cb > 0)
411 {
412 bool fRc;
413 if (cbOnLine >= 16)
414 {
415 fRc = outputPrintf("\n"
416 " dd 0%08xh", *pu32);
417 cbOnLine = 4;
418 }
419 else if (!cbOnLine)
420 {
421 fRc = outputPrintf(" dd 0%08xh", *pu32);
422 cbOnLine = 4;
423 }
424 else
425 {
426 fRc = outputPrintf(", 0%08xh", *pu32);
427 cbOnLine += 4;
428 }
429 if (!fRc)
430 return false;
431 pu32++;
432 cb -= 4;
433 }
434 return outputPrintf("\n");
435}
436
437
438static bool disStringData(uint32_t uFlatAddr, uint32_t cb)
439{
440 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
441 uint32_t cchOnLine = 0;
442 while (cb > 0)
443 {
444 /* Line endings and beginnings. */
445 if (cchOnLine >= 72)
446 {
447 if (!outputPrintf("\n"))
448 return false;
449 cchOnLine = 0;
450 }
451 if ( !cchOnLine
452 && !outputPrintf(" db "))
453 return false;
454
455 /* See how many printable character we've got. */
456 uint32_t cchPrintable = 0;
457 while ( cchPrintable < cb
458 && RT_C_IS_PRINT(pb[cchPrintable])
459 && pb[cchPrintable] != '\'')
460 cchPrintable++;
461
462 bool fRc = true;
463 if (cchPrintable)
464 {
465 if (cchPrintable + cchOnLine > 72)
466 cchPrintable = 72 - cchOnLine;
467 if (cchOnLine)
468 {
469 fRc = outputPrintf(", '%.*s'", cchPrintable, pb);
470 cchOnLine += 4 + cchPrintable;
471 }
472 else
473 {
474 fRc = outputPrintf("'%.*s'", cchPrintable, pb);
475 cchOnLine += 2 + cchPrintable;
476 }
477 pb += cchPrintable;
478 cb -= cchPrintable;
479 }
480 else
481 {
482 if (cchOnLine)
483 {
484 fRc = outputPrintf(", 0%02xh", *pb);
485 cchOnLine += 6;
486 }
487 else
488 {
489 fRc = outputPrintf("0%02xh", *pb);
490 cchOnLine += 4;
491 }
492 pb++;
493 cb--;
494 }
495 if (!fRc)
496 return false;
497 }
498 return outputPrintf("\n");
499}
500
501
502/**
503 * For dumping a portion of a string table.
504 *
505 * @returns @c true on success, @c false on failure.
506 * @param uFlatAddr The start address.
507 * @param cb The size of the string table.
508 */
509static bool disStringsData(uint32_t uFlatAddr, uint32_t cb)
510{
511 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
512 uint32_t cchOnLine = 0;
513 uint8_t bPrev = 255;
514 while (cb > 0)
515 {
516 /* Line endings and beginnings. */
517 if ( cchOnLine >= 72
518 || (bPrev == '\0' && *pb != '\0'))
519 {
520 if (!outputPrintf("\n"))
521 return false;
522 cchOnLine = 0;
523 }
524 if ( !cchOnLine
525 && !outputPrintf(" db "))
526 return false;
527
528 /* See how many printable character we've got. */
529 uint32_t cchPrintable = 0;
530 while ( cchPrintable < cb
531 && RT_C_IS_PRINT(pb[cchPrintable])
532 && pb[cchPrintable] != '\'')
533 cchPrintable++;
534
535 bool fRc = true;
536 if (cchPrintable)
537 {
538 if (cchPrintable + cchOnLine > 72)
539 cchPrintable = 72 - cchOnLine;
540 if (cchOnLine)
541 {
542 fRc = outputPrintf(", '%.*s'", cchPrintable, pb);
543 cchOnLine += 4 + cchPrintable;
544 }
545 else
546 {
547 fRc = outputPrintf("'%.*s'", cchPrintable, pb);
548 cchOnLine += 2 + cchPrintable;
549 }
550 pb += cchPrintable;
551 cb -= cchPrintable;
552 }
553 else
554 {
555 if (cchOnLine)
556 {
557 fRc = outputPrintf(", 0%02xh", *pb);
558 cchOnLine += 6;
559 }
560 else
561 {
562 fRc = outputPrintf("0%02xh", *pb);
563 cchOnLine += 4;
564 }
565 pb++;
566 cb--;
567 }
568 if (!fRc)
569 return false;
570 bPrev = pb[-1];
571 }
572 return outputPrintf("\n");
573}
574
575
576/**
577 * Minds the gap between two segments.
578 *
579 * Gaps should generally be zero filled.
580 *
581 * @returns @c true on success, @c false on failure.
582 * @param uFlatAddr The address of the gap.
583 * @param cbPadding The size of the gap.
584 */
585static bool disCopySegmentGap(uint32_t uFlatAddr, uint32_t cbPadding)
586{
587 if (g_cVerbose > 0)
588 outputPrintf("\n"
589 " ; Padding %#x bytes at %#x\n", cbPadding, uFlatAddr);
590 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
591 if (!ASMMemIsAll8(pb, cbPadding, 0))
592 return outputPrintf(" times %u db 0\n", cbPadding);
593
594 return disByteData(uFlatAddr, cbPadding);
595}
596
597
598/**
599 * Worker for disGetNextSymbol that only does the looking up, no RTDBSYMBOL::cb
600 * calc.
601 *
602 * @param uFlatAddr The address to start searching at.
603 * @param cbMax The size of the search range.
604 * @param poff Where to return the offset between the symbol
605 * and @a uFlatAddr.
606 * @param pSym Where to return the symbol data.
607 */
608static void disGetNextSymbolWorker(uint32_t uFlatAddr, uint32_t cbMax, uint32_t *poff, PRTDBGSYMBOL pSym)
609{
610 RTINTPTR off = 0;
611 int rc = RTDbgModSymbolByAddr(g_hMapMod, RTDBGSEGIDX_RVA, uFlatAddr, RTDBGSYMADDR_FLAGS_GREATER_OR_EQUAL, &off, pSym);
612 if (RT_SUCCESS(rc))
613 {
614 /* negative offset, indicates beyond. */
615 if (off <= 0)
616 {
617 *poff = (uint32_t)-off;
618 return;
619 }
620
621 outputPrintf(" ; !! RTDbgModSymbolByAddr(,,%#x,,) -> off=%RTptr cb=%RTptr uValue=%RTptr '%s'\n",
622 uFlatAddr, off, pSym->cb, pSym->Value, pSym->szName);
623 }
624 else if (rc != VERR_SYMBOL_NOT_FOUND)
625 outputPrintf(" ; !! RTDbgModSymbolByAddr(,,%#x,,) -> %Rrc\n", uFlatAddr, rc);
626
627 RTStrPrintf(pSym->szName, sizeof(pSym->szName), "_dummy_addr_%#x", uFlatAddr + cbMax);
628 pSym->Value = uFlatAddr + cbMax;
629 pSym->cb = 0;
630 pSym->offSeg = uFlatAddr + cbMax;
631 pSym->iSeg = RTDBGSEGIDX_RVA;
632 pSym->iOrdinal = 0;
633 pSym->fFlags = 0;
634 *poff = cbMax;
635}
636
637
638/**
639 * Gets the symbol at or after the given address.
640 *
641 * If there are no symbols in the specified range, @a pSym and @a poff will be
642 * set up to indicate a symbol at the first byte after the range.
643 *
644 * @param uFlatAddr The address to start searching at.
645 * @param cbMax The size of the search range.
646 * @param poff Where to return the offset between the symbol
647 * and @a uFlatAddr.
648 * @param pSym Where to return the symbol data.
649 */
650static void disGetNextSymbol(uint32_t uFlatAddr, uint32_t cbMax, uint32_t *poff, PRTDBGSYMBOL pSym)
651{
652 disGetNextSymbolWorker(uFlatAddr, cbMax, poff, pSym);
653 if ( *poff < cbMax
654 && pSym->cb == 0)
655 {
656 if (*poff + 1 < cbMax)
657 {
658 uint32_t off2;
659 RTDBGSYMBOL Sym2;
660 disGetNextSymbolWorker(uFlatAddr + *poff + 1, cbMax - *poff - 1, &off2, &Sym2);
661 pSym->cb = off2 + 1;
662 }
663 else
664 pSym->cb = 1;
665 }
666 if (pSym->cb > cbMax - *poff)
667 pSym->cb = cbMax - *poff;
668
669 if (g_cVerbose > 1)
670 outputPrintf(" ; disGetNextSymbol %#x LB %#x -> off=%#x cb=%RTptr uValue=%RTptr '%s'\n",
671 uFlatAddr, cbMax, *poff, pSym->cb, pSym->Value, pSym->szName);
672
673}
674
675
676/**
677 * For dealing with the const segment (string constants).
678 *
679 * @returns @c true on success, @c false on failure.
680 * @param iSeg The segment.
681 */
682static bool disConstSegment(uint32_t iSeg)
683{
684 uint32_t uFlatAddr = g_aSegs[iSeg].uFlatAddr;
685 uint32_t cb = g_aSegs[iSeg].cb;
686
687 while (cb > 0)
688 {
689 uint32_t off;
690 RTDBGSYMBOL Sym;
691 disGetNextSymbol(uFlatAddr, cb, &off, &Sym);
692
693 if (off > 0)
694 {
695 if (!disStringsData(uFlatAddr, off))
696 return false;
697 cb -= off;
698 uFlatAddr += off;
699 off = 0;
700 if (!cb)
701 break;
702 }
703
704 bool fRc;
705 if (off == 0)
706 {
707 size_t cchName = strlen(Sym.szName);
708 fRc = outputPrintf("%s: %*s; %#x LB %#x\n", Sym.szName, cchName < 41 - 2 ? cchName - 41 - 2 : 0, "", uFlatAddr, Sym.cb);
709 if (!fRc)
710 return false;
711 fRc = disStringsData(uFlatAddr, Sym.cb);
712 uFlatAddr += Sym.cb;
713 cb -= Sym.cb;
714 }
715 else
716 {
717 fRc = disStringsData(uFlatAddr, Sym.cb);
718 uFlatAddr += cb;
719 cb = 0;
720 }
721 if (!fRc)
722 return false;
723 }
724
725 return true;
726}
727
728
729
730static bool disDataSegment(uint32_t iSeg)
731{
732 uint32_t uFlatAddr = g_aSegs[iSeg].uFlatAddr;
733 uint32_t cb = g_aSegs[iSeg].cb;
734
735 while (cb > 0)
736 {
737 uint32_t off;
738 RTDBGSYMBOL Sym;
739 disGetNextSymbol(uFlatAddr, cb, &off, &Sym);
740
741 if (off > 0)
742 {
743 if (!disByteData(uFlatAddr, off))
744 return false;
745 cb -= off;
746 uFlatAddr += off;
747 off = 0;
748 if (!cb)
749 break;
750 }
751
752 bool fRc;
753 if (off == 0)
754 {
755 size_t cchName = strlen(Sym.szName);
756 fRc = outputPrintf("%s: %*s; %#x LB %#x\n", Sym.szName, cchName < 41 - 2 ? cchName - 41 - 2 : 0, "", uFlatAddr, Sym.cb);
757 if (!fRc)
758 return false;
759
760 if (Sym.cb == 2)
761 fRc = disWordData(uFlatAddr, 2);
762 //else if (Sym.cb == 4 && disIsFarBiosAddr(uFlatAddr))
763 // fRc = disDWordData(uFlatAddr, 4);
764 else if (Sym.cb == 4)
765 fRc = disDWordData(uFlatAddr, 4);
766 else if (disIsString(uFlatAddr, Sym.cb))
767 fRc = disStringData(uFlatAddr, Sym.cb);
768 else
769 fRc = disByteData(uFlatAddr, Sym.cb);
770
771 uFlatAddr += Sym.cb;
772 cb -= Sym.cb;
773 }
774 else
775 {
776 fRc = disByteData(uFlatAddr, cb);
777 uFlatAddr += cb;
778 cb = 0;
779 }
780 if (!fRc)
781 return false;
782 }
783
784 return true;
785}
786
787
788static bool disIsCodeAndAdjustSize(uint32_t uFlatAddr, PRTDBGSYMBOL pSym, PBIOSSEG pSeg)
789{
790 if (!strcmp(pSeg->szName, "BIOSSEG"))
791 {
792 if ( !strcmp(pSym->szName, "rom_fdpt")
793 || !strcmp(pSym->szName, "pmbios_gdt")
794 || !strcmp(pSym->szName, "pmbios_gdt_desc")
795 || !strcmp(pSym->szName, "_pmode_IDT")
796 || !strcmp(pSym->szName, "_rmode_IDT")
797 || !strncmp(pSym->szName, RT_STR_TUPLE("font"))
798 || !strcmp(pSym->szName, "bios_string")
799 || !strcmp(pSym->szName, "vector_table")
800 || !strcmp(pSym->szName, "pci_routing_table_structure")
801 )
802 return false;
803 }
804
805 if (!strcmp(pSym->szName, "cpu_reset"))
806 pSym->cb = RT_MIN(pSym->cb, 5);
807 else if (!strcmp(pSym->szName, "pci_init_end"))
808 pSym->cb = RT_MIN(pSym->cb, 3);
809
810 return true;
811}
812
813
814static bool disIs16BitCode(const char *pszSymbol)
815{
816 return true;
817}
818
819
820/**
821 * Deals with instructions that YASM will assemble differently than WASM/WCC.
822 */
823static size_t disHandleYasmDifferences(PDISCPUSTATE pCpuState, uint32_t uFlatAddr, uint32_t cbInstr,
824 char *pszBuf, size_t cbBuf, size_t cchUsed)
825{
826 bool fDifferent = DISFormatYasmIsOddEncoding(pCpuState);
827 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
828
829 /*
830 * Disassembler bugs.
831 */
832 /** @todo Group 1a and 11 seems to be disassembled incorrectly when
833 * modrm.reg != 0. Those encodings should be invalid AFAICT. */
834
835 if ( ( pCpuState->opcode == 0x8f /* group 1a */
836 || pCpuState->opcode == 0xc7 /* group 11 */
837 || pCpuState->opcode == 0xc6 /* group 11 - not verified */
838 )
839 && pCpuState->ModRM.Bits.Reg != 0)
840 fDifferent = true;
841 /** @todo "TEST Eb,Ib" (f6 0f 08) ends up with no mnemonic as well as
842 * wrong length (2 instead of 3)! */
843 else if ( pCpuState->opcode == 0xf6
844 && pb[1] == 0x0f
845 && pb[2] == 0x08
846 && RT_C_IS_SPACE(*pszBuf) )
847 fDifferent = true;
848 /** @todo "INSB Yb,DX" (6c) ends up with no mnemonic here. */
849 else if (pCpuState->opcode == 0x6c && RT_C_IS_SPACE(*pszBuf))
850 fDifferent = true;
851 /*
852 * Check these out and consider adding them to DISFormatYasmIsOddEncoding.
853 */
854 else if ( pb[0] == 0xf3
855 && pb[1] == 0x66
856 && pb[2] == 0x6d)
857 fDifferent = true; /* rep insd - prefix switched. */
858 else if ( pb[0] == 0xc6
859 && pb[1] == 0xc5
860 && pb[2] == 0xba)
861 fDifferent = true; /* mov ch, 0bah - yasm uses a short sequence: 0xb5 0xba. */
862 /*
863 * Switch table fun (.sym may help):
864 */
865#if 0
866 else if ( pb[0] == 0x64
867 && pb[1] == 0x65
868 && pb[2] == 0x05
869 /*&& pb[3] == 0x61
870 && pb[4] == 0x19*/)
871 fDifferent = true; /* gs add ax, 01961h - both fs and gs prefix. Probably some switch table. */
872 else if ( pb[0] == 0x65
873 && pb[1] == 0x36
874 && pb[2] == 0x65
875 && pb[3] == 0xae)
876 fDifferent = true; /* gs scasb - switch table or smth. */
877 else if ( pb[0] == 0x67
878 && pb[1] == 0xe7
879 /*&& pb[2] == 0x67*/)
880 fDifferent = true; /* out 067h, ax - switch table or smth. */
881#endif
882
883
884 /*
885 * Handle different stuff.
886 */
887 if (fDifferent)
888 {
889 disByteData(uFlatAddr, cbInstr); /* lazy bird. */
890
891 if (cchUsed + 2 < cbBuf)
892 {
893 memmove(pszBuf + 2, pszBuf, cchUsed + 2);
894 cchUsed += 2;
895 }
896
897 pszBuf[0] = ';';
898 pszBuf[1] = ' ';
899 }
900
901 return cchUsed;
902}
903
904
905/**
906 * @callback_method_impl{FNDISREADBYTES}
907 *
908 * @remarks @a uSrcAddr is the flat address.
909 */
910static DECLCALLBACK(int) disReadOpcodeBytes(PDISCPUSTATE pDisState, uint8_t *pbDst, RTUINTPTR uSrcAddr, uint32_t cbToRead)
911{
912 if (uSrcAddr + cbToRead >= VBOX_BIOS_BASE + _64K)
913 {
914 RT_BZERO(pbDst, cbToRead);
915 if (uSrcAddr >= VBOX_BIOS_BASE + _64K)
916 cbToRead = 0;
917 else
918 cbToRead = VBOX_BIOS_BASE + _64K - uSrcAddr;
919 }
920 memcpy(pbDst, &g_pbImg[uSrcAddr - VBOX_BIOS_BASE], cbToRead);
921 NOREF(pDisState);
922 return VINF_SUCCESS;
923}
924
925
926/**
927 * Disassembles code.
928 *
929 * @returns @c true on success, @c false on failure.
930 * @param uFlatAddr The address where the code starts.
931 * @param cb The amount of code to disassemble.
932 * @param fIs16Bit Is is 16-bit (@c true) or 32-bit (@c false).
933 */
934static bool disCode(uint32_t uFlatAddr, uint32_t cb, bool fIs16Bit)
935{
936 uint8_t const *pb = &g_pbImg[uFlatAddr - VBOX_BIOS_BASE];
937
938 while (cb > 0)
939 {
940 /* Trailing zero padding detection. */
941 if ( *pb == '\0'
942 && ASMMemIsAll8(pb, RT_MIN(cb, 8), 0) == NULL)
943 {
944 void *pv = ASMMemIsAll8(pb, cb, 0);
945 uint32_t cbZeros = pv ? (uint32_t)((uint8_t const *)pv - pb) : cb;
946 if (!outputPrintf(" times %#x db 0\n", cbZeros))
947 return false;
948 cb -= cbZeros;
949 pb += cbZeros;
950 uFlatAddr += cbZeros;
951 if ( cb == 2
952 && pb[0] == 'X'
953 && pb[1] == 'M')
954 return disStringData(uFlatAddr, cb);
955 }
956 /* Work arounds for switch tables and such (disas assertions). */
957 else if ( ( pb[0] == 0x11 /* int13_cdemu switch */
958 && pb[1] == 0xda
959 && pb[2] == 0x05
960 && pb[3] == 0xff
961 && pb[4] == 0xff
962 )
963 || 0
964 )
965 return disByteData(uFlatAddr, cb);
966 else
967 {
968 unsigned cbInstr;
969 DISCPUSTATE CpuState;
970 int rc = DISCoreOneWithReader(uFlatAddr, fIs16Bit ? CPUMODE_16BIT : CPUMODE_32BIT,
971 disReadOpcodeBytes, NULL, &CpuState, &cbInstr);
972 if ( RT_SUCCESS(rc)
973 && cbInstr <= cb)
974 {
975 char szTmp[4096];
976 size_t cch = DISFormatYasmEx(&CpuState, szTmp, sizeof(szTmp),
977 DIS_FMT_FLAGS_STRICT
978 | DIS_FMT_FLAGS_BYTES_RIGHT | DIS_FMT_FLAGS_BYTES_COMMENT | DIS_FMT_FLAGS_BYTES_SPACED,
979 NULL, NULL);
980 cch = disHandleYasmDifferences(&CpuState, uFlatAddr, cbInstr, szTmp, sizeof(szTmp), cch);
981 Assert(cch < sizeof(szTmp));
982
983 if (g_cVerbose > 1)
984 {
985 while (cch < 72)
986 szTmp[cch++] = ' ';
987 RTStrPrintf(&szTmp[cch], sizeof(szTmp) - cch, "; %#x", uFlatAddr);
988 }
989
990 if (!outputPrintf(" %s\n", szTmp))
991 return false;
992 cb -= cbInstr;
993 pb += cbInstr;
994 uFlatAddr += cbInstr;
995 }
996 else
997 {
998 if (!disByteData(uFlatAddr, 1))
999 return false;
1000 cb--;
1001 pb++;
1002 uFlatAddr++;
1003 }
1004 }
1005 }
1006 return true;
1007}
1008
1009
1010static bool disCodeSegment(uint32_t iSeg)
1011{
1012 uint32_t uFlatAddr = g_aSegs[iSeg].uFlatAddr;
1013 uint32_t cb = g_aSegs[iSeg].cb;
1014
1015 while (cb > 0)
1016 {
1017 uint32_t off;
1018 RTDBGSYMBOL Sym;
1019 disGetNextSymbol(uFlatAddr, cb, &off, &Sym);
1020
1021 if (off > 0)
1022 {
1023 if (!disByteData(uFlatAddr, off))
1024 return false;
1025 cb -= off;
1026 uFlatAddr += off;
1027 off = 0;
1028 if (!cb)
1029 break;
1030 }
1031
1032 bool fRc;
1033 if (off == 0)
1034 {
1035 size_t cchName = strlen(Sym.szName);
1036 fRc = outputPrintf("%s: %*s; %#x LB %#x\n", Sym.szName, cchName < 41 - 2 ? cchName - 41 - 2 : 0, "", uFlatAddr, Sym.cb);
1037 if (!fRc)
1038 return false;
1039
1040 if (disIsCodeAndAdjustSize(uFlatAddr, &Sym, &g_aSegs[iSeg]))
1041 fRc = disCode(uFlatAddr, Sym.cb, disIs16BitCode(Sym.szName));
1042 else
1043 fRc = disByteData(uFlatAddr, Sym.cb);
1044
1045 uFlatAddr += Sym.cb;
1046 cb -= Sym.cb;
1047 }
1048 else
1049 {
1050 fRc = disByteData(uFlatAddr, cb);
1051 uFlatAddr += cb;
1052 cb = 0;
1053 }
1054 if (!fRc)
1055 return false;
1056 }
1057
1058 return true;
1059}
1060
1061
1062static RTEXITCODE DisassembleBiosImage(void)
1063{
1064 if (!disFileHeader())
1065 return RTEXITCODE_FAILURE;
1066
1067 /*
1068 * Work the image segment by segment.
1069 */
1070 bool fRc = true;
1071 uint32_t uFlatAddr = VBOX_BIOS_BASE;
1072 for (uint32_t iSeg = 0; iSeg < g_cSegs && fRc; iSeg++)
1073 {
1074 /* Is there a gap between the segments? */
1075 if (uFlatAddr < g_aSegs[iSeg].uFlatAddr)
1076 {
1077 fRc = disCopySegmentGap(uFlatAddr, g_aSegs[iSeg].uFlatAddr - uFlatAddr);
1078 if (!fRc)
1079 break;
1080 uFlatAddr = g_aSegs[iSeg].uFlatAddr;
1081 }
1082 else if (uFlatAddr > g_aSegs[iSeg].uFlatAddr)
1083 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Overlapping segments: %u and %u; uFlatAddr=%#x\n", iSeg - 1, iSeg, uFlatAddr);
1084
1085 /* Disassemble the segment. */
1086 fRc = outputPrintf("\n"
1087 "section %s progbits vstart=%#x align=1 ; size=%#x class=%s group=%s\n",
1088 g_aSegs[iSeg].szName, g_aSegs[iSeg].uFlatAddr - VBOX_BIOS_BASE,
1089 g_aSegs[iSeg].cb, g_aSegs[iSeg].szClass, g_aSegs[iSeg].szGroup);
1090 if (!fRc)
1091 return RTEXITCODE_FAILURE;
1092 if (!strcmp(g_aSegs[iSeg].szName, "CONST"))
1093 fRc = disConstSegment(iSeg);
1094 else if (!strcmp(g_aSegs[iSeg].szClass, "DATA"))
1095 fRc = disDataSegment(iSeg);
1096 else
1097 fRc = disCodeSegment(iSeg);
1098
1099 /* Advance. */
1100 uFlatAddr += g_aSegs[iSeg].cb;
1101 }
1102
1103 /* Final gap. */
1104 if (uFlatAddr < VBOX_BIOS_BASE + _64K)
1105 fRc = disCopySegmentGap(uFlatAddr, VBOX_BIOS_BASE + _64K - uFlatAddr);
1106 else if (uFlatAddr > VBOX_BIOS_BASE + _64K)
1107 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Last segment spills beyond 1MB; uFlatAddr=%#x\n", uFlatAddr);
1108
1109 if (!fRc)
1110 return RTEXITCODE_FAILURE;
1111 return RTEXITCODE_SUCCESS;
1112}
1113
1114
1115
1116/**
1117 * Parses the symbol file for the BIOS.
1118 *
1119 * This is in ELF/DWARF format.
1120 *
1121 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
1122 * @param pszBiosSym Path to the sym file.
1123 */
1124static RTEXITCODE ParseSymFile(const char *pszBiosSym)
1125{
1126#if 1
1127 /** @todo use RTDbg* later. (Just checking for existance currently.) */
1128 PRTSTREAM hStrm;
1129 int rc = RTStrmOpen(pszBiosSym, "rb", &hStrm);
1130 if (RT_FAILURE(rc))
1131 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Error opening '%s': %Rrc", pszBiosSym, rc);
1132 RTStrmClose(hStrm);
1133#else
1134 RTDBGMOD hDbgMod;
1135 int rc = RTDbgModCreateFromImage(&hDbgMod, pszBiosSym, "VBoxBios", 0 /*fFlags*/);
1136 RTMsgInfo("RTDbgModCreateFromImage -> %Rrc\n", rc);
1137#endif
1138 return RTEXITCODE_SUCCESS;
1139}
1140
1141
1142/**
1143 * Display an error with the mapfile name and current line, return false.
1144 *
1145 * @returns @c false.
1146 * @param pMap The map file handle.
1147 * @param pszFormat The format string.
1148 * @param ... Format arguments.
1149 */
1150static bool mapError(PBIOSMAP pMap, const char *pszFormat, ...)
1151{
1152 va_list va;
1153 va_start(va, pszFormat);
1154 RTMsgError("%s:%d: %N", pMap->pszMapFile, pMap->iLine, pszFormat, va);
1155 va_end(va);
1156 return false;
1157}
1158
1159
1160/**
1161 * Reads a line from the file.
1162 *
1163 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1164 * @param pMap The map file handle.
1165 */
1166static bool mapReadLine(PBIOSMAP pMap)
1167{
1168 int rc = RTStrmGetLine(pMap->hStrm, pMap->szLine, sizeof(pMap->szLine));
1169 if (RT_FAILURE(rc))
1170 {
1171 if (rc == VERR_EOF)
1172 {
1173 pMap->fEof = true;
1174 pMap->cch = 0;
1175 pMap->offNW = 0;
1176 pMap->szLine[0] = '\0';
1177 }
1178 else
1179 RTMsgError("%s:%d: Read error %Rrc", pMap->pszMapFile, pMap->iLine + 1, rc);
1180 return false;
1181 }
1182 pMap->iLine++;
1183 pMap->cch = (uint32_t)strlen(pMap->szLine);
1184
1185 /* Check out leading white space. */
1186 if (!RT_C_IS_SPACE(pMap->szLine[0]))
1187 pMap->offNW = 0;
1188 else
1189 {
1190 uint32_t off = 1;
1191 while (RT_C_IS_SPACE(pMap->szLine[off]))
1192 off++;
1193 pMap->offNW = off;
1194 }
1195
1196 return true;
1197}
1198
1199
1200/**
1201 * Checks if it is an empty line.
1202 * @returns @c true if empty, @c false if not.
1203 * @param pMap The map file handle.
1204 */
1205static bool mapIsEmptyLine(PBIOSMAP pMap)
1206{
1207 Assert(pMap->offNW <= pMap->cch);
1208 return pMap->offNW == pMap->cch;
1209}
1210
1211
1212/**
1213 * Reads ahead in the map file until a non-empty line or EOF is encountered.
1214 *
1215 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1216 * @param pMap The map file handle.
1217 */
1218static bool mapSkipEmptyLines(PBIOSMAP pMap)
1219{
1220 for (;;)
1221 {
1222 if (!mapReadLine(pMap))
1223 return false;
1224 if (pMap->offNW < pMap->cch)
1225 return true;
1226 }
1227}
1228
1229
1230/**
1231 * Reads ahead in the map file until an empty line or EOF is encountered.
1232 *
1233 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1234 * @param pMap The map file handle.
1235 */
1236static bool mapSkipNonEmptyLines(PBIOSMAP pMap)
1237{
1238 for (;;)
1239 {
1240 if (!mapReadLine(pMap))
1241 return false;
1242 if (pMap->offNW == pMap->cch)
1243 return true;
1244 }
1245}
1246
1247
1248/**
1249 * Strips the current line.
1250 *
1251 * The string length may change.
1252 *
1253 * @returns Pointer to the first non-space character.
1254 * @param pMap The map file handle.
1255 * @param pcch Where to return the length of the unstripped
1256 * part. Optional.
1257 */
1258static char *mapStripCurrentLine(PBIOSMAP pMap, size_t *pcch)
1259{
1260 char *psz = &pMap->szLine[pMap->offNW];
1261 char *pszEnd = &pMap->szLine[pMap->cch];
1262 while ( (uintptr_t)pszEnd > (uintptr_t)psz
1263 && RT_C_IS_SPACE(pszEnd[-1]))
1264 {
1265 *--pszEnd = '\0';
1266 pMap->cch--;
1267 }
1268 if (pcch)
1269 *pcch = pszEnd - psz;
1270 return psz;
1271}
1272
1273
1274/**
1275 * Reads a line from the file and right strips it.
1276 *
1277 * @returns Pointer to szLine on success, @c NULL + msg on failure, @c NULL on
1278 * EOF.
1279 * @param pMap The map file handle.
1280 * @param pcch Where to return the length of the unstripped
1281 * part. Optional.
1282 */
1283static char *mapReadLineStripRight(PBIOSMAP pMap, size_t *pcch)
1284{
1285 if (!mapReadLine(pMap))
1286 return NULL;
1287 mapStripCurrentLine(pMap, NULL);
1288 if (pcch)
1289 *pcch = pMap->cch;
1290 return pMap->szLine;
1291}
1292
1293
1294/**
1295 * mapReadLine() + mapStripCurrentLine().
1296 *
1297 * @returns Pointer to the first non-space character in the new line. NULL on
1298 * read error (bitched already) or end of file.
1299 * @param pMap The map file handle.
1300 * @param pcch Where to return the length of the unstripped
1301 * part. Optional.
1302 */
1303static char *mapReadLineStrip(PBIOSMAP pMap, size_t *pcch)
1304{
1305 if (!mapReadLine(pMap))
1306 return NULL;
1307 return mapStripCurrentLine(pMap, pcch);
1308}
1309
1310
1311/**
1312 * Parses a word, copying it into the supplied buffer, and skipping any spaces
1313 * following it.
1314 *
1315 * @returns @c true on success, @c false on failure.
1316 * @param ppszCursor Pointer to the cursor variable.
1317 * @param pszBuf The output buffer.
1318 * @param cbBuf The size of the output buffer.
1319 */
1320static bool mapParseWord(char **ppszCursor, char *pszBuf, size_t cbBuf)
1321{
1322 /* Check that we start on a non-blank. */
1323 char *pszStart = *ppszCursor;
1324 if (!*pszStart || RT_C_IS_SPACE(*pszStart))
1325 return false;
1326
1327 /* Find the end of the word. */
1328 char *psz = pszStart + 1;
1329 while (*psz && !RT_C_IS_SPACE(*psz))
1330 psz++;
1331
1332 /* Copy it. */
1333 size_t cchWord = (uintptr_t)psz - (uintptr_t)pszStart;
1334 if (cchWord >= cbBuf)
1335 return false;
1336 memcpy(pszBuf, pszStart, cchWord);
1337 pszBuf[cchWord] = '\0';
1338
1339 /* Skip blanks following it. */
1340 while (RT_C_IS_SPACE(*psz))
1341 psz++;
1342 *ppszCursor = psz;
1343 return true;
1344}
1345
1346
1347/**
1348 * Parses an 16:16 address.
1349 *
1350 * @returns @c true on success, @c false on failure.
1351 * @param ppszCursor Pointer to the cursor variable.
1352 * @param pAddr Where to return the address.
1353 */
1354static bool mapParseAddress(char **ppszCursor, PRTFAR16 pAddr)
1355{
1356 char szWord[32];
1357 if (!mapParseWord(ppszCursor, szWord, sizeof(szWord)))
1358 return false;
1359 size_t cchWord = strlen(szWord);
1360
1361 /* An address is at least 16:16 format. It may be 16:32. It may also be flagged. */
1362 size_t cchAddr = 4 + 1 + 4;
1363 if (cchWord < cchAddr)
1364 return false;
1365 if ( !RT_C_IS_XDIGIT(szWord[0])
1366 || !RT_C_IS_XDIGIT(szWord[1])
1367 || !RT_C_IS_XDIGIT(szWord[2])
1368 || !RT_C_IS_XDIGIT(szWord[3])
1369 || szWord[4] != ':'
1370 || !RT_C_IS_XDIGIT(szWord[5])
1371 || !RT_C_IS_XDIGIT(szWord[6])
1372 || !RT_C_IS_XDIGIT(szWord[7])
1373 || !RT_C_IS_XDIGIT(szWord[8])
1374 )
1375 return false;
1376 if ( cchWord > cchAddr
1377 && RT_C_IS_XDIGIT(szWord[9])
1378 && RT_C_IS_XDIGIT(szWord[10])
1379 && RT_C_IS_XDIGIT(szWord[11])
1380 && RT_C_IS_XDIGIT(szWord[12]))
1381 cchAddr += 4;
1382
1383 /* Drop flag if present. */
1384 if (cchWord > cchAddr)
1385 {
1386 if (RT_C_IS_XDIGIT(szWord[4+1+4]))
1387 return false;
1388 szWord[cchAddr] = '\0';
1389 cchWord = cchAddr;
1390 }
1391
1392 /* Convert it. */
1393 szWord[4] = '\0';
1394 int rc1 = RTStrToUInt16Full(szWord, 16, &pAddr->sel);
1395 if (rc1 != VINF_SUCCESS)
1396 return false;
1397
1398 int rc2 = RTStrToUInt16Full(szWord + 5, 16, &pAddr->off);
1399 if (rc2 != VINF_SUCCESS)
1400 return false;
1401 return true;
1402}
1403
1404
1405/**
1406 * Parses a size.
1407 *
1408 * @returns @c true on success, @c false on failure.
1409 * @param ppszCursor Pointer to the cursor variable.
1410 * @param pcb Where to return the size.
1411 */
1412static bool mapParseSize(char **ppszCursor, uint32_t *pcb)
1413{
1414 char szWord[32];
1415 if (!mapParseWord(ppszCursor, szWord, sizeof(szWord)))
1416 return false;
1417 size_t cchWord = strlen(szWord);
1418 if (cchWord != 8)
1419 return false;
1420
1421 int rc = RTStrToUInt32Full(szWord, 16, pcb);
1422 if (rc != VINF_SUCCESS)
1423 return false;
1424 return true;
1425}
1426
1427
1428/**
1429 * Parses a section box and the following column header.
1430 *
1431 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1432 * @param pMap Map file handle.
1433 * @param pszSectionNm The expected section name.
1434 * @param cColumns The number of columns.
1435 * @param ... The column names.
1436 */
1437static bool mapSkipThruColumnHeadings(PBIOSMAP pMap, const char *pszSectionNm, uint32_t cColumns, ...)
1438{
1439 if ( mapIsEmptyLine(pMap)
1440 && !mapSkipEmptyLines(pMap))
1441 return false;
1442
1443 /* +------------+ */
1444 size_t cch;
1445 char *psz = mapStripCurrentLine(pMap, &cch);
1446 if (!psz)
1447 return false;
1448
1449 if ( psz[0] != '+'
1450 || psz[1] != '-'
1451 || psz[2] != '-'
1452 || psz[3] != '-'
1453 || psz[cch - 4] != '-'
1454 || psz[cch - 3] != '-'
1455 || psz[cch - 2] != '-'
1456 || psz[cch - 1] != '+'
1457 )
1458 {
1459 RTMsgError("%s:%d: Expected section box: +-----...", pMap->pszMapFile, pMap->iLine);
1460 return false;
1461 }
1462
1463 /* | pszSectionNm | */
1464 psz = mapReadLineStrip(pMap, &cch);
1465 if (!psz)
1466 return false;
1467
1468 size_t cchSectionNm = strlen(pszSectionNm);
1469 if ( psz[0] != '|'
1470 || psz[1] != ' '
1471 || psz[2] != ' '
1472 || psz[3] != ' '
1473 || psz[cch - 4] != ' '
1474 || psz[cch - 3] != ' '
1475 || psz[cch - 2] != ' '
1476 || psz[cch - 1] != '|'
1477 || cch != 1 + 3 + cchSectionNm + 3 + 1
1478 || strncmp(&psz[4], pszSectionNm, cchSectionNm)
1479 )
1480 {
1481 RTMsgError("%s:%d: Expected section box: | %s |", pMap->pszMapFile, pMap->iLine, pszSectionNm);
1482 return false;
1483 }
1484
1485 /* +------------+ */
1486 psz = mapReadLineStrip(pMap, &cch);
1487 if (!psz)
1488 return false;
1489 if ( psz[0] != '+'
1490 || psz[1] != '-'
1491 || psz[2] != '-'
1492 || psz[3] != '-'
1493 || psz[cch - 4] != '-'
1494 || psz[cch - 3] != '-'
1495 || psz[cch - 2] != '-'
1496 || psz[cch - 1] != '+'
1497 )
1498 {
1499 RTMsgError("%s:%d: Expected section box: +-----...", pMap->pszMapFile, pMap->iLine);
1500 return false;
1501 }
1502
1503 /* There may be a few lines describing the table notation now, surrounded by blank lines. */
1504 do
1505 {
1506 psz = mapReadLineStripRight(pMap, &cch);
1507 if (!psz)
1508 return false;
1509 } while ( *psz == '\0'
1510 || ( !RT_C_IS_SPACE(psz[0])
1511 && RT_C_IS_SPACE(psz[1])
1512 && psz[2] == '='
1513 && RT_C_IS_SPACE(psz[3]))
1514 );
1515
1516 /* Should have the column heading now. */
1517 va_list va;
1518 va_start(va, cColumns);
1519 for (uint32_t i = 0; i < cColumns; i++)
1520 {
1521 const char *pszColumn = va_arg(va, const char *);
1522 size_t cchColumn = strlen(pszColumn);
1523 if ( strncmp(psz, pszColumn, cchColumn)
1524 || ( psz[cchColumn] != '\0'
1525 && !RT_C_IS_SPACE(psz[cchColumn])))
1526 {
1527 va_end(va);
1528 RTMsgError("%s:%d: Expected column '%s' found '%s'", pMap->pszMapFile, pMap->iLine, pszColumn, psz);
1529 return false;
1530 }
1531 psz += cchColumn;
1532 while (RT_C_IS_SPACE(*psz))
1533 psz++;
1534 }
1535 va_end(va);
1536
1537 /* The next line is the underlining. */
1538 psz = mapReadLineStripRight(pMap, &cch);
1539 if (!psz)
1540 return false;
1541 if (*psz != '=' || psz[cch - 1] != '=')
1542 {
1543 RTMsgError("%s:%d: Expected column header underlining", pMap->pszMapFile, pMap->iLine);
1544 return false;
1545 }
1546
1547 /* Skip one blank line. */
1548 psz = mapReadLineStripRight(pMap, &cch);
1549 if (!psz)
1550 return false;
1551 if (*psz)
1552 {
1553 RTMsgError("%s:%d: Expected blank line beneath the column headers", pMap->pszMapFile, pMap->iLine);
1554 return false;
1555 }
1556
1557 return true;
1558}
1559
1560
1561/**
1562 * Parses a segment list.
1563 *
1564 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1565 * @param pMap The map file handle.
1566 */
1567static bool mapParseSegments(PBIOSMAP pMap)
1568{
1569 for (;;)
1570 {
1571 if (!mapReadLineStripRight(pMap, NULL))
1572 return false;
1573
1574 /* The end? The line should be empty. Expectes segment name to not
1575 start with a space. */
1576 if (!pMap->szLine[0] || RT_C_IS_SPACE(pMap->szLine[0]))
1577 {
1578 if (!pMap->szLine[0])
1579 return true;
1580 RTMsgError("%s:%u: Malformed segment line", pMap->pszMapFile, pMap->iLine);
1581 return false;
1582 }
1583
1584 /* Parse the segment line. */
1585 uint32_t iSeg = g_cSegs;
1586 if (iSeg >= RT_ELEMENTS(g_aSegs))
1587 {
1588 RTMsgError("%s:%u: Too many segments", pMap->pszMapFile, pMap->iLine);
1589 return false;
1590 }
1591
1592 char *psz = pMap->szLine;
1593 if (!mapParseWord(&psz, g_aSegs[iSeg].szName, sizeof(g_aSegs[iSeg].szName)))
1594 RTMsgError("%s:%u: Segment name parser error", pMap->pszMapFile, pMap->iLine);
1595 else if (!mapParseWord(&psz, g_aSegs[iSeg].szClass, sizeof(g_aSegs[iSeg].szClass)))
1596 RTMsgError("%s:%u: Segment class parser error", pMap->pszMapFile, pMap->iLine);
1597 else if (!mapParseWord(&psz, g_aSegs[iSeg].szGroup, sizeof(g_aSegs[iSeg].szGroup)))
1598 RTMsgError("%s:%u: Segment group parser error", pMap->pszMapFile, pMap->iLine);
1599 else if (!mapParseAddress(&psz, &g_aSegs[iSeg].Address))
1600 RTMsgError("%s:%u: Segment address parser error", pMap->pszMapFile, pMap->iLine);
1601 else if (!mapParseSize(&psz, &g_aSegs[iSeg].cb))
1602 RTMsgError("%s:%u: Segment size parser error", pMap->pszMapFile, pMap->iLine);
1603 else
1604 {
1605 g_aSegs[iSeg].uFlatAddr = ((uint32_t)g_aSegs[iSeg].Address.sel << 4) + g_aSegs[iSeg].Address.off;
1606 g_cSegs++;
1607 if (g_cVerbose > 2)
1608 RTStrmPrintf(g_pStdErr, "read segment at %08x / %04x:%04x LB %04x %s / %s / %s\n",
1609 g_aSegs[iSeg].uFlatAddr,
1610 g_aSegs[iSeg].Address.sel,
1611 g_aSegs[iSeg].Address.off,
1612 g_aSegs[iSeg].cb,
1613 g_aSegs[iSeg].szName,
1614 g_aSegs[iSeg].szClass,
1615 g_aSegs[iSeg].szGroup);
1616
1617 while (RT_C_IS_SPACE(*psz))
1618 psz++;
1619 if (!*psz)
1620 continue;
1621 RTMsgError("%s:%u: Junk at end of line", pMap->pszMapFile, pMap->iLine);
1622 }
1623 return false;
1624 }
1625}
1626
1627
1628/**
1629 * Sorts the segment array by flat address and adds them to the debug module.
1630 *
1631 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1632 */
1633static bool mapSortAndAddSegments(void)
1634{
1635 for (uint32_t i = 0; i < g_cSegs; i++)
1636 {
1637 for (uint32_t j = i + 1; j < g_cSegs; j++)
1638 if (g_aSegs[j].uFlatAddr < g_aSegs[i].uFlatAddr)
1639 {
1640 BIOSSEG Tmp = g_aSegs[i];
1641 g_aSegs[i] = g_aSegs[j];
1642 g_aSegs[j] = Tmp;
1643 }
1644 if (g_cVerbose > 0)
1645 RTStrmPrintf(g_pStdErr, "segment at %08x / %04x:%04x LB %04x %s / %s / %s\n",
1646 g_aSegs[i].uFlatAddr,
1647 g_aSegs[i].Address.sel,
1648 g_aSegs[i].Address.off,
1649 g_aSegs[i].cb,
1650 g_aSegs[i].szName,
1651 g_aSegs[i].szClass,
1652 g_aSegs[i].szGroup);
1653
1654 RTDBGSEGIDX idx = i;
1655 int rc = RTDbgModSegmentAdd(g_hMapMod, g_aSegs[i].uFlatAddr, g_aSegs[i].cb, g_aSegs[i].szName, 0 /*fFlags*/, &idx);
1656 if (RT_FAILURE(rc))
1657 {
1658 RTMsgError("RTDbgModSegmentAdd failed on %s: %Rrc", g_aSegs[i].szName);
1659 return false;
1660 }
1661 }
1662 return true;
1663}
1664
1665
1666/**
1667 * Parses a segment list.
1668 *
1669 * @returns @c true on success, @c false + msg on failure, @c false on eof.
1670 * @param pMap The map file handle.
1671 */
1672static bool mapParseSymbols(PBIOSMAP pMap)
1673{
1674 for (;;)
1675 {
1676 if (!mapReadLineStripRight(pMap, NULL))
1677 return false;
1678
1679 /* The end? The line should be empty. Expectes segment name to not
1680 start with a space. */
1681 if (!pMap->szLine[0] || RT_C_IS_SPACE(pMap->szLine[0]))
1682 {
1683 if (!pMap->szLine[0])
1684 return true;
1685 return mapError(pMap, "Malformed symbol line");
1686 }
1687
1688 if (!strncmp(pMap->szLine, RT_STR_TUPLE("Module: ")))
1689 {
1690 /* Parse the module line. */
1691 size_t offObj = sizeof("Module: ") - 1;
1692 while (RT_C_IS_SPACE(pMap->szLine[offObj]))
1693 offObj++;
1694 size_t offSrc = offObj;
1695 char ch;
1696 while ((ch = pMap->szLine[offSrc]) != '(' && ch != '\0')
1697 offSrc++;
1698 size_t cchObj = offSrc - offObj;
1699
1700 offSrc++;
1701 size_t cchSrc = offSrc;
1702 while ((ch = pMap->szLine[cchSrc]) != ')' && ch != '\0')
1703 cchSrc++;
1704 cchSrc -= offSrc;
1705 if (ch != ')')
1706 return mapError(pMap, "Symbol/Module line parse error");
1707
1708 PBIOSOBJFILE pObjFile = (PBIOSOBJFILE)RTMemAllocZ(sizeof(*pObjFile) + cchSrc + cchObj + 2);
1709 if (!pObjFile)
1710 return mapError(pMap, "Out of memory");
1711 char *psz = (char *)(pObjFile + 1);
1712 pObjFile->pszObject = psz;
1713 memcpy(psz, &pMap->szLine[offObj], cchObj);
1714 psz += cchObj;
1715 *psz++ = '\0';
1716 pObjFile->pszSource = psz;
1717 memcpy(psz, &pMap->szLine[offSrc], cchSrc);
1718 psz[cchSrc] = '\0';
1719 RTListAppend(&g_ObjList, &pObjFile->Node);
1720 }
1721 else
1722 {
1723 /* Parse the segment line. */
1724 RTFAR16 Addr;
1725 char *psz = pMap->szLine;
1726 if (!mapParseAddress(&psz, &Addr))
1727 return mapError(pMap, "Symbol address parser error");
1728
1729 char szName[4096];
1730 if (!mapParseWord(&psz, szName, sizeof(szName)))
1731 return mapError(pMap, "Symbol name parser error");
1732
1733 uint32_t uFlatAddr = ((uint32_t)Addr.sel << 4) + Addr.off;
1734 if (uFlatAddr != 0)
1735 {
1736 int rc = RTDbgModSymbolAdd(g_hMapMod, szName, RTDBGSEGIDX_RVA, uFlatAddr, 0 /*cb*/, 0 /*fFlags*/, NULL);
1737 if (RT_FAILURE(rc) && rc != VERR_DBG_ADDRESS_CONFLICT)
1738 return mapError(pMap, "RTDbgModSymbolAdd failed: %Rrc", rc);
1739
1740 if (g_cVerbose > 2)
1741 RTStrmPrintf(g_pStdErr, "read symbol - %08x %s\n", uFlatAddr, szName);
1742 while (RT_C_IS_SPACE(*psz))
1743 psz++;
1744 if (*psz)
1745 return mapError(pMap, "Junk at end of line");
1746 }
1747
1748 }
1749 }
1750}
1751
1752
1753/**
1754 * Parses the given map file.
1755 *
1756 * @returns RTEXITCODE_SUCCESS and lots of globals, or RTEXITCODE_FAILURE and a
1757 * error message.
1758 * @param pMap The map file handle.
1759 */
1760static RTEXITCODE mapParseFile(PBIOSMAP pMap)
1761{
1762 int rc = RTDbgModCreate(&g_hMapMod, "VBoxBios", 0 /*cbSeg*/, 0 /*fFlags*/);
1763 if (RT_FAILURE(rc))
1764 return RTMsgErrorExit(RTEXITCODE_FAILURE, "RTDbgModCreate failed: %Rrc", rc);
1765
1766 /*
1767 * Read the header.
1768 */
1769 if (!mapReadLine(pMap))
1770 return RTEXITCODE_FAILURE;
1771 if (strncmp(pMap->szLine, RT_STR_TUPLE("Open Watcom Linker Version")))
1772 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Unexpected map-file header: '%s'", pMap->szLine);
1773 if ( !mapSkipNonEmptyLines(pMap)
1774 || !mapSkipEmptyLines(pMap))
1775 return RTEXITCODE_FAILURE;
1776
1777 /*
1778 * Skip groups.
1779 */
1780 if (!mapSkipThruColumnHeadings(pMap, "Groups", 3, "Group", "Address", "Size", NULL))
1781 return RTEXITCODE_FAILURE;
1782 if (!mapSkipNonEmptyLines(pMap))
1783 return RTEXITCODE_FAILURE;
1784
1785 /*
1786 * Parse segments.
1787 */
1788 if (!mapSkipThruColumnHeadings(pMap, "Segments", 5, "Segment", "Class", "Group", "Address", "Size"))
1789 return RTEXITCODE_FAILURE;
1790 if (!mapParseSegments(pMap))
1791 return RTEXITCODE_FAILURE;
1792 if (!mapSortAndAddSegments())
1793 return RTEXITCODE_FAILURE;
1794
1795 /*
1796 * Parse symbols.
1797 */
1798 if (!mapSkipThruColumnHeadings(pMap, "Memory Map", 2, "Address", "Symbol"))
1799 return RTEXITCODE_FAILURE;
1800 if (!mapParseSymbols(pMap))
1801 return RTEXITCODE_FAILURE;
1802
1803 /* Ignore the rest of the file. */
1804 return RTEXITCODE_SUCCESS;
1805}
1806
1807
1808/**
1809 * Parses the linker map file for the BIOS.
1810 *
1811 * This is generated by the Watcom linker.
1812 *
1813 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
1814 * @param pszBiosMap Path to the map file.
1815 */
1816static RTEXITCODE ParseMapFile(const char *pszBiosMap)
1817{
1818 BIOSMAP Map;
1819 Map.pszMapFile = pszBiosMap;
1820 Map.hStrm = NULL;
1821 Map.iLine = 0;
1822 Map.fEof = false;
1823 Map.cch = 0;
1824 Map.offNW = 0;
1825 int rc = RTStrmOpen(pszBiosMap, "r", &Map.hStrm);
1826 if (RT_FAILURE(rc))
1827 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Error opening '%s': %Rrc", pszBiosMap, rc);
1828 RTEXITCODE rcExit = mapParseFile(&Map);
1829 RTStrmClose(Map.hStrm);
1830 return rcExit;
1831}
1832
1833
1834/**
1835 * Reads the BIOS image into memory (g_pbImg and g_cbImg).
1836 *
1837 * @returns RTEXITCODE_SUCCESS or RTEXITCODE_FAILURE+msg.
1838 * @param pszBiosImg Path to the image file.
1839 */
1840static RTEXITCODE ReadBiosImage(const char *pszBiosImg)
1841{
1842 void *pvImg;
1843 size_t cbImg;
1844 int rc = RTFileReadAll(pszBiosImg, &pvImg, &cbImg);
1845 if (RT_FAILURE(rc))
1846 return RTMsgErrorExit(RTEXITCODE_FAILURE, "Error reading '%s': %Rrc", pszBiosImg, rc);
1847 if (cbImg != _64K)
1848 {
1849 RTFileReadAllFree(pvImg, cbImg);
1850 return RTMsgErrorExit(RTEXITCODE_FAILURE, "The BIOS image %u bytes intead of 64KB", cbImg);
1851 }
1852
1853 g_pbImg = (uint8_t *)pvImg;
1854 g_cbImg = cbImg;
1855 return RTEXITCODE_SUCCESS;
1856}
1857
1858
1859int main(int argc, char **argv)
1860{
1861 int rc = RTR3InitExe(argc, &argv, 0);
1862 if (RT_FAILURE(rc))
1863 return RTMsgInitFailure(rc);
1864
1865 RTListInit(&g_ObjList);
1866
1867 /*
1868 * Option config.
1869 */
1870 static RTGETOPTDEF const s_aOpts[] =
1871 {
1872 { "--bios-image", 'i', RTGETOPT_REQ_STRING },
1873 { "--bios-map", 'm', RTGETOPT_REQ_STRING },
1874 { "--bios-sym", 's', RTGETOPT_REQ_STRING },
1875 { "--output", 'o', RTGETOPT_REQ_STRING },
1876 { "--verbose", 'v', RTGETOPT_REQ_NOTHING },
1877 { "--quiet", 'q', RTGETOPT_REQ_NOTHING },
1878 };
1879
1880 const char *pszBiosMap = NULL;
1881 const char *pszBiosSym = NULL;
1882 const char *pszBiosImg = NULL;
1883 const char *pszOutput = NULL;
1884
1885 RTGETOPTUNION ValueUnion;
1886 RTGETOPTSTATE GetOptState;
1887 rc = RTGetOptInit(&GetOptState, argc, argv, &s_aOpts[0], RT_ELEMENTS(s_aOpts), 1, RTGETOPTINIT_FLAGS_OPTS_FIRST);
1888 AssertReleaseRCReturn(rc, RTEXITCODE_FAILURE);
1889
1890 /*
1891 * Process the options.
1892 */
1893 while ((rc = RTGetOpt(&GetOptState, &ValueUnion)) != 0)
1894 {
1895 switch (rc)
1896 {
1897 case 'i':
1898 if (pszBiosImg)
1899 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-image is given more than once");
1900 pszBiosImg = ValueUnion.psz;
1901 break;
1902
1903 case 'm':
1904 if (pszBiosMap)
1905 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-map is given more than once");
1906 pszBiosMap = ValueUnion.psz;
1907 break;
1908
1909 case 's':
1910 if (pszBiosSym)
1911 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-sym is given more than once");
1912 pszBiosSym = ValueUnion.psz;
1913 break;
1914
1915 case 'o':
1916 if (pszOutput)
1917 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--output is given more than once");
1918 pszOutput = ValueUnion.psz;
1919 break;
1920
1921 case 'v':
1922 g_cVerbose++;
1923 break;
1924
1925 case 'q':
1926 g_cVerbose = 0;
1927 break;
1928
1929 case 'H':
1930 RTPrintf("usage: %Rbn --bios-image <file.img> --bios-map <file.map> [--output <file.asm>]\n",
1931 argv[0]);
1932 return RTEXITCODE_SUCCESS;
1933
1934 case 'V':
1935 {
1936 /* The following is assuming that svn does it's job here. */
1937 RTPrintf("r%u\n", RTBldCfgRevision());
1938 return RTEXITCODE_SUCCESS;
1939 }
1940
1941 default:
1942 return RTGetOptPrintError(rc, &ValueUnion);
1943 }
1944 }
1945
1946 /*
1947 * Got it all?
1948 */
1949 if (!pszBiosImg)
1950 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-image is required");
1951 if (!pszBiosMap)
1952 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-map is required");
1953 if (!pszBiosSym)
1954 return RTMsgErrorExit(RTEXITCODE_SYNTAX, "--bios-sym is required");
1955
1956 /*
1957 * Do the job.
1958 */
1959 RTEXITCODE rcExit;
1960 rcExit = ReadBiosImage(pszBiosImg);
1961 if (rcExit == RTEXITCODE_SUCCESS)
1962 rcExit = ParseMapFile(pszBiosMap);
1963 if (rcExit == RTEXITCODE_SUCCESS)
1964 rcExit = ParseSymFile(pszBiosSym);
1965 if (rcExit == RTEXITCODE_SUCCESS)
1966 rcExit = OpenOutputFile(pszOutput);
1967 if (rcExit == RTEXITCODE_SUCCESS)
1968 rcExit = DisassembleBiosImage();
1969
1970 return rcExit;
1971}
1972
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette