/* pass.c */
  1. #include "l.h"
  2. void
  3. dodata(void)
  4. {
  5. int i;
  6. Sym *s;
  7. Prog *p;
  8. long t, u;
  9. if(debug['v'])
  10. Bprint(&bso, "%5.2f dodata\n", cputime());
  11. Bflush(&bso);
  12. for(p = datap; p != P; p = p->link) {
  13. s = p->from.sym;
  14. if(p->as == ADYNT || p->as == AINIT)
  15. s->value = dtype;
  16. if(s->type == SBSS)
  17. s->type = SDATA;
  18. if(s->type != SDATA)
  19. diag("initialize non-data (%d): %s\n%P",
  20. s->type, s->name, p);
  21. t = p->from.offset + p->width;
  22. if(t > s->value)
  23. diag("initialize bounds (%ld): %s\n%P",
  24. s->value, s->name, p);
  25. }
  26. /* allocate small guys */
  27. datsize = 0;
  28. for(i=0; i<NHASH; i++)
  29. for(s = hash[i]; s != S; s = s->link) {
  30. if(s->type != SDATA)
  31. if(s->type != SBSS)
  32. continue;
  33. t = s->value;
  34. if(t == 0) {
  35. diag("%s: no size", s->name);
  36. t = 1;
  37. }
  38. t = rnd(t, 4);;
  39. s->value = t;
  40. if(t > MINSIZ)
  41. continue;
  42. s->value = datsize;
  43. datsize += t;
  44. s->type = SDATA1;
  45. }
  46. /* allocate the rest of the data */
  47. for(i=0; i<NHASH; i++)
  48. for(s = hash[i]; s != S; s = s->link) {
  49. if(s->type != SDATA) {
  50. if(s->type == SDATA1)
  51. s->type = SDATA;
  52. continue;
  53. }
  54. t = s->value;
  55. s->value = datsize;
  56. datsize += t;
  57. }
  58. if(debug['j']) {
  59. /*
  60. * pad data with bss that fits up to next
  61. * 8k boundary, then push data to 8k
  62. */
  63. u = rnd(datsize, 8192);
  64. u -= datsize;
  65. for(i=0; i<NHASH; i++)
  66. for(s = hash[i]; s != S; s = s->link) {
  67. if(s->type != SBSS)
  68. continue;
  69. t = s->value;
  70. if(t > u)
  71. continue;
  72. u -= t;
  73. s->value = datsize;
  74. s->type = SDATA;
  75. datsize += t;
  76. }
  77. datsize += u;
  78. }
  79. /* now the bss */
  80. bsssize = 0;
  81. for(i=0; i<NHASH; i++)
  82. for(s = hash[i]; s != S; s = s->link) {
  83. if(s->type != SBSS)
  84. continue;
  85. t = s->value;
  86. s->value = bsssize + datsize;
  87. bsssize += t;
  88. }
  89. xdefine("edata", SBSS, datsize);
  90. xdefine("end", SBSS, bsssize + datsize);
  91. }
  92. Prog*
  93. brchain(Prog *p)
  94. {
  95. int i;
  96. for(i=0; i<20; i++) {
  97. if(p == P || p->as != AJMP)
  98. return p;
  99. p = p->pcond;
  100. }
  101. return P;
  102. }
  103. void
  104. follow(void)
  105. {
  106. if(debug['v'])
  107. Bprint(&bso, "%5.2f follow\n", cputime());
  108. Bflush(&bso);
  109. firstp = prg();
  110. lastp = firstp;
  111. xfol(textp);
  112. lastp->link = P;
  113. firstp = firstp->link;
  114. }
  115. void
  116. xfol(Prog *p)
  117. {
  118. Prog *q;
  119. int i;
  120. enum as a;
  121. loop:
  122. if(p == P)
  123. return;
  124. if(p->as == ATEXT)
  125. curtext = p;
  126. if(p->as == AJMP)
  127. if((q = p->pcond) != P) {
  128. p->mark = 1;
  129. p = q;
  130. if(p->mark == 0)
  131. goto loop;
  132. }
  133. if(p->mark) {
  134. /* copy up to 4 instructions to avoid branch */
  135. for(i=0,q=p; i<4; i++,q=q->link) {
  136. if(q == P)
  137. break;
  138. if(q == lastp)
  139. break;
  140. a = q->as;
  141. if(a == ANOP) {
  142. i--;
  143. continue;
  144. }
  145. switch(a) {
  146. case AJMP:
  147. case ARET:
  148. case AIRETL:
  149. case APUSHL:
  150. case APUSHFL:
  151. case APUSHW:
  152. case APUSHFW:
  153. case APOPL:
  154. case APOPFL:
  155. case APOPW:
  156. case APOPFW:
  157. goto brk;
  158. }
  159. if(q->pcond == P || q->pcond->mark)
  160. continue;
  161. if(a == ACALL || a == ALOOP)
  162. continue;
  163. for(;;) {
  164. if(p->as == ANOP) {
  165. p = p->link;
  166. continue;
  167. }
  168. q = copyp(p);
  169. p = p->link;
  170. q->mark = 1;
  171. lastp->link = q;
  172. lastp = q;
  173. if(q->as != a || q->pcond == P || q->pcond->mark)
  174. continue;
  175. q->as = relinv(q->as);
  176. p = q->pcond;
  177. q->pcond = q->link;
  178. q->link = p;
  179. xfol(q->link);
  180. p = q->link;
  181. if(p->mark)
  182. return;
  183. goto loop;
  184. }
  185. } /* */
  186. brk:;
  187. q = prg();
  188. q->as = AJMP;
  189. q->line = p->line;
  190. q->to.type = D_BRANCH;
  191. q->to.offset = p->pc;
  192. q->pcond = p;
  193. p = q;
  194. }
  195. p->mark = 1;
  196. lastp->link = p;
  197. lastp = p;
  198. a = p->as;
  199. if(a == AJMP || a == ARET || a == AIRETL)
  200. return;
  201. if(p->pcond != P)
  202. if(a != ACALL) {
  203. q = brchain(p->link);
  204. if(q != P && q->mark)
  205. if(a != ALOOP) {
  206. p->as = relinv(a);
  207. p->link = p->pcond;
  208. p->pcond = q;
  209. }
  210. xfol(p->link);
  211. q = brchain(p->pcond);
  212. if(q->mark) {
  213. p->pcond = q;
  214. return;
  215. }
  216. p = q;
  217. goto loop;
  218. }
  219. p = p->link;
  220. goto loop;
  221. }
  222. int
  223. relinv(int a)
  224. {
  225. switch(a) {
  226. case AJEQ: return AJNE;
  227. case AJNE: return AJEQ;
  228. case AJLE: return AJGT;
  229. case AJLS: return AJHI;
  230. case AJLT: return AJGE;
  231. case AJMI: return AJPL;
  232. case AJGE: return AJLT;
  233. case AJPL: return AJMI;
  234. case AJGT: return AJLE;
  235. case AJHI: return AJLS;
  236. case AJCS: return AJCC;
  237. case AJCC: return AJCS;
  238. case AJPS: return AJPC;
  239. case AJPC: return AJPS;
  240. case AJOS: return AJOC;
  241. case AJOC: return AJOS;
  242. }
  243. diag("unknown relation: %s in %s", anames[a], TNAME);
  244. return a;
  245. }
  246. void
  247. doinit(void)
  248. {
  249. Sym *s;
  250. Prog *p;
  251. int x;
  252. for(p = datap; p != P; p = p->link) {
  253. x = p->to.type;
  254. if(x != D_EXTERN && x != D_STATIC)
  255. continue;
  256. s = p->to.sym;
  257. if(s->type == 0 || s->type == SXREF)
  258. diag("undefined %s initializer of %s",
  259. s->name, p->from.sym->name);
  260. p->to.offset += s->value;
  261. p->to.type = D_CONST;
  262. if(s->type == SDATA || s->type == SBSS)
  263. p->to.offset += INITDAT;
  264. }
  265. }
  266. void
  267. patch(void)
  268. {
  269. long c;
  270. Prog *p, *q;
  271. Sym *s;
  272. long vexit;
  273. if(debug['v'])
  274. Bprint(&bso, "%5.2f mkfwd\n", cputime());
  275. Bflush(&bso);
  276. mkfwd();
  277. if(debug['v'])
  278. Bprint(&bso, "%5.2f patch\n", cputime());
  279. Bflush(&bso);
  280. s = lookup("exit", 0);
  281. vexit = s->value;
  282. for(p = firstp; p != P; p = p->link) {
  283. if(p->as == ATEXT)
  284. curtext = p;
  285. if(p->as == ACALL || p->as == ARET) {
  286. s = p->to.sym;
  287. if(s) {
  288. if(debug['c'])
  289. Bprint(&bso, "%s calls %s\n", TNAME, s->name);
  290. switch(s->type) {
  291. default:
  292. diag("undefined: %s in %s", s->name, TNAME);
  293. s->type = STEXT;
  294. s->value = vexit;
  295. break; /* or fall through to set offset? */
  296. case STEXT:
  297. p->to.offset = s->value;
  298. break;
  299. case SUNDEF:
  300. p->pcond = UP;
  301. p->to.offset = 0;
  302. break;
  303. }
  304. p->to.type = D_BRANCH;
  305. }
  306. }
  307. if(p->to.type != D_BRANCH || p->pcond == UP)
  308. continue;
  309. c = p->to.offset;
  310. for(q = firstp; q != P;) {
  311. if(q->forwd != P)
  312. if(c >= q->forwd->pc) {
  313. q = q->forwd;
  314. continue;
  315. }
  316. if(c == q->pc)
  317. break;
  318. q = q->link;
  319. }
  320. if(q == P) {
  321. diag("branch out of range in %s\n%P", TNAME, p);
  322. p->to.type = D_NONE;
  323. }
  324. p->pcond = q;
  325. }
  326. for(p = firstp; p != P; p = p->link) {
  327. if(p->as == ATEXT)
  328. curtext = p;
  329. p->mark = 0; /* initialization for follow */
  330. if(p->pcond != P && p->pcond != UP) {
  331. p->pcond = brloop(p->pcond);
  332. if(p->pcond != P)
  333. if(p->to.type == D_BRANCH)
  334. p->to.offset = p->pcond->pc;
  335. }
  336. }
  337. }
  338. #define LOG 5
  339. void
  340. mkfwd(void)
  341. {
  342. Prog *p;
  343. int i;
  344. long dwn[LOG], cnt[LOG];
  345. Prog *lst[LOG];
  346. for(i=0; i<LOG; i++) {
  347. if(i == 0)
  348. cnt[i] = 1; else
  349. cnt[i] = LOG * cnt[i-1];
  350. dwn[i] = 1;
  351. lst[i] = P;
  352. }
  353. i = 0;
  354. for(p = firstp; p != P; p = p->link) {
  355. if(p->as == ATEXT)
  356. curtext = p;
  357. i--;
  358. if(i < 0)
  359. i = LOG-1;
  360. p->forwd = P;
  361. dwn[i]--;
  362. if(dwn[i] <= 0) {
  363. dwn[i] = cnt[i];
  364. if(lst[i] != P)
  365. lst[i]->forwd = p;
  366. lst[i] = p;
  367. }
  368. }
  369. }
  370. Prog*
  371. brloop(Prog *p)
  372. {
  373. int c;
  374. Prog *q;
  375. c = 0;
  376. for(q = p; q != P; q = q->pcond) {
  377. if(q->as != AJMP)
  378. break;
  379. c++;
  380. if(c >= 5000)
  381. return P;
  382. }
  383. return q;
  384. }
  385. void
  386. dostkoff(void)
  387. {
  388. Prog *p, *q;
  389. long autoffset, deltasp;
  390. int a, f, curframe, curbecome, maxbecome;
  391. curframe = 0;
  392. curbecome = 0;
  393. maxbecome = 0;
  394. curtext = 0;
  395. for(p = firstp; p != P; p = p->link) {
  396. /* find out how much arg space is used in this TEXT */
  397. if(p->to.type == (D_INDIR+D_SP))
  398. if(p->to.offset > curframe)
  399. curframe = p->to.offset;
  400. switch(p->as) {
  401. case ATEXT:
  402. if(curtext && curtext->from.sym) {
  403. curtext->from.sym->frame = curframe;
  404. curtext->from.sym->become = curbecome;
  405. if(curbecome > maxbecome)
  406. maxbecome = curbecome;
  407. }
  408. curframe = 0;
  409. curbecome = 0;
  410. curtext = p;
  411. break;
  412. case ARET:
  413. /* special form of RET is BECOME */
  414. if(p->from.type == D_CONST)
  415. if(p->from.offset > curbecome)
  416. curbecome = p->from.offset;
  417. break;
  418. }
  419. }
  420. if(curtext && curtext->from.sym) {
  421. curtext->from.sym->frame = curframe;
  422. curtext->from.sym->become = curbecome;
  423. if(curbecome > maxbecome)
  424. maxbecome = curbecome;
  425. }
  426. if(debug['b'])
  427. print("max become = %d\n", maxbecome);
  428. xdefine("ALEFbecome", STEXT, maxbecome);
  429. curtext = 0;
  430. for(p = firstp; p != P; p = p->link) {
  431. switch(p->as) {
  432. case ATEXT:
  433. curtext = p;
  434. break;
  435. case ACALL:
  436. if(curtext != P && curtext->from.sym != S && curtext->to.offset >= 0) {
  437. f = maxbecome - curtext->from.sym->frame;
  438. if(f <= 0)
  439. break;
  440. /* calling a become or calling a variable */
  441. if(p->to.sym == S || p->to.sym->become) {
  442. curtext->to.offset += f;
  443. if(debug['b']) {
  444. curp = p;
  445. print("%D calling %D increase %d\n",
  446. &curtext->from, &p->to, f);
  447. }
  448. }
  449. }
  450. break;
  451. }
  452. }
  453. autoffset = 0;
  454. deltasp = 0;
  455. for(p = firstp; p != P; p = p->link) {
  456. if(p->as == ATEXT) {
  457. curtext = p;
  458. autoffset = p->to.offset;
  459. if(autoffset < 0)
  460. autoffset = 0;
  461. if(autoffset) {
  462. p = appendp(p);
  463. p->as = AADJSP;
  464. p->from.type = D_CONST;
  465. p->from.offset = autoffset;
  466. }
  467. deltasp = autoffset;
  468. }
  469. a = p->from.type;
  470. if(a == D_AUTO)
  471. p->from.offset += deltasp;
  472. if(a == D_PARAM)
  473. p->from.offset += deltasp + 4;
  474. a = p->to.type;
  475. if(a == D_AUTO)
  476. p->to.offset += deltasp;
  477. if(a == D_PARAM)
  478. p->to.offset += deltasp + 4;
  479. switch(p->as) {
  480. default:
  481. continue;
  482. case APUSHL:
  483. case APUSHFL:
  484. deltasp += 4;
  485. continue;
  486. case APUSHW:
  487. case APUSHFW:
  488. deltasp += 2;
  489. continue;
  490. case APOPL:
  491. case APOPFL:
  492. deltasp -= 4;
  493. continue;
  494. case APOPW:
  495. case APOPFW:
  496. deltasp -= 2;
  497. continue;
  498. case ARET:
  499. break;
  500. }
  501. if(autoffset != deltasp)
  502. diag("unbalanced PUSH/POP");
  503. if(p->from.type == D_CONST)
  504. goto become;
  505. if(autoffset) {
  506. q = p;
  507. p = appendp(p);
  508. p->as = ARET;
  509. q->as = AADJSP;
  510. q->from.type = D_CONST;
  511. q->from.offset = -autoffset;
  512. }
  513. continue;
  514. become:
  515. q = p;
  516. p = appendp(p);
  517. p->as = AJMP;
  518. p->to = q->to;
  519. p->pcond = q->pcond;
  520. q->as = AADJSP;
  521. q->from = zprg.from;
  522. q->from.type = D_CONST;
  523. q->from.offset = -autoffset;
  524. q->to = zprg.to;
  525. continue;
  526. }
  527. }
  528. long
  529. atolwhex(char *s)
  530. {
  531. long n;
  532. int f;
  533. n = 0;
  534. f = 0;
  535. while(*s == ' ' || *s == '\t')
  536. s++;
  537. if(*s == '-' || *s == '+') {
  538. if(*s++ == '-')
  539. f = 1;
  540. while(*s == ' ' || *s == '\t')
  541. s++;
  542. }
  543. if(s[0]=='0' && s[1]){
  544. if(s[1]=='x' || s[1]=='X'){
  545. s += 2;
  546. for(;;){
  547. if(*s >= '0' && *s <= '9')
  548. n = n*16 + *s++ - '0';
  549. else if(*s >= 'a' && *s <= 'f')
  550. n = n*16 + *s++ - 'a' + 10;
  551. else if(*s >= 'A' && *s <= 'F')
  552. n = n*16 + *s++ - 'A' + 10;
  553. else
  554. break;
  555. }
  556. } else
  557. while(*s >= '0' && *s <= '7')
  558. n = n*8 + *s++ - '0';
  559. } else
  560. while(*s >= '0' && *s <= '9')
  561. n = n*10 + *s++ - '0';
  562. if(f)
  563. n = -n;
  564. return n;
  565. }
  566. void
  567. undef(void)
  568. {
  569. int i;
  570. Sym *s;
  571. for(i=0; i<NHASH; i++)
  572. for(s = hash[i]; s != S; s = s->link)
  573. if(s->type == SXREF)
  574. diag("%s: not defined", s->name);
  575. }
  576. void
  577. import(void)
  578. {
  579. int i;
  580. Sym *s;
  581. for(i = 0; i < NHASH; i++)
  582. for(s = hash[i]; s != S; s = s->link)
  583. if(s->sig != 0 && s->type == SXREF && (nimports == 0 || s->subtype == SIMPORT)){
  584. if(s->value != 0)
  585. diag("value != 0 on SXREF");
  586. undefsym(s);
  587. if(debug['X'])
  588. Bprint(&bso, "IMPORT: %s sig=%lux v=%ld\n", s->name, s->sig, s->value);
  589. if(debug['S'])
  590. s->sig = 0;
  591. }
  592. }
  593. void
  594. ckoff(Sym *s, long v)
  595. {
  596. if(v < 0 || v >= 1<<Roffset)
  597. diag("relocation offset %ld for %s out of range", v, s->name);
  598. }
  599. static Prog*
  600. newdata(Sym *s, int o, int w, int t)
  601. {
  602. Prog *p;
  603. p = prg();
  604. if(edatap == P)
  605. datap = p;
  606. else
  607. edatap->link = p;
  608. edatap = p;
  609. p->as = ADATA;
  610. p->width = w;
  611. p->from.scale = w;
  612. p->from.type = t;
  613. p->from.sym = s;
  614. p->from.offset = o;
  615. p->to.type = D_CONST;
  616. return p;
  617. }
  618. void
  619. export(void)
  620. {
  621. int i, j, n, off, nb, sv, ne;
  622. Sym *s, *et, *str, **esyms;
  623. Prog *p;
  624. char buf[NSNAME], *t;
  625. n = 0;
  626. for(i = 0; i < NHASH; i++)
  627. for(s = hash[i]; s != S; s = s->link)
  628. if(s->sig != 0 && s->type != SXREF && s->type != SUNDEF && (nexports == 0 || s->subtype == SEXPORT))
  629. n++;
  630. esyms = malloc(n*sizeof(Sym*));
  631. ne = n;
  632. n = 0;
  633. for(i = 0; i < NHASH; i++)
  634. for(s = hash[i]; s != S; s = s->link)
  635. if(s->sig != 0 && s->type != SXREF && s->type != SUNDEF && (nexports == 0 || s->subtype == SEXPORT))
  636. esyms[n++] = s;
  637. for(i = 0; i < ne-1; i++)
  638. for(j = i+1; j < ne; j++)
  639. if(strcmp(esyms[i]->name, esyms[j]->name) > 0){
  640. s = esyms[i];
  641. esyms[i] = esyms[j];
  642. esyms[j] = s;
  643. }
  644. nb = 0;
  645. off = 0;
  646. et = lookup(EXPTAB, 0);
  647. if(et->type != 0 && et->type != SXREF)
  648. diag("%s already defined", EXPTAB);
  649. et->type = SDATA;
  650. str = lookup(".string", 0);
  651. if(str->type == 0)
  652. str->type = SDATA;
  653. sv = str->value;
  654. for(i = 0; i < ne; i++){
  655. s = esyms[i];
  656. if(debug['S'])
  657. s->sig = 0;
  658. /* Bprint(&bso, "EXPORT: %s sig=%lux t=%d\n", s->name, s->sig, s->type); */
  659. /* signature */
  660. p = newdata(et, off, sizeof(long), D_EXTERN);
  661. off += sizeof(long);
  662. p->to.offset = s->sig;
  663. /* address */
  664. p = newdata(et, off, sizeof(long), D_EXTERN);
  665. off += sizeof(long);
  666. p->to.type = D_ADDR;
  667. p->to.index = D_EXTERN;
  668. p->to.sym = s;
  669. /* string */
  670. t = s->name;
  671. n = strlen(t)+1;
  672. for(;;){
  673. buf[nb++] = *t;
  674. sv++;
  675. if(nb >= NSNAME){
  676. p = newdata(str, sv-NSNAME, NSNAME, D_STATIC);
  677. p->to.type = D_SCONST;
  678. memmove(p->to.scon, buf, NSNAME);
  679. nb = 0;
  680. }
  681. if(*t++ == 0)
  682. break;
  683. }
  684. /* name */
  685. p = newdata(et, off, sizeof(long), D_EXTERN);
  686. off += sizeof(long);
  687. p->to.type = D_ADDR;
  688. p->to.index = D_STATIC;
  689. p->to.sym = str;
  690. p->to.offset = sv-n;
  691. }
  692. if(nb > 0){
  693. p = newdata(str, sv-nb, nb, D_STATIC);
  694. p->to.type = D_SCONST;
  695. memmove(p->to.scon, buf, nb);
  696. }
  697. for(i = 0; i < 3; i++){
  698. newdata(et, off, sizeof(long), D_EXTERN);
  699. off += sizeof(long);
  700. }
  701. et->value = off;
  702. if(sv == 0)
  703. sv = 1;
  704. str->value = sv;
  705. exports = ne;
  706. free(esyms);
  707. }