You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
преди 18 години
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528
  1. /*
  2. * libcucul Canvas for ultrafast compositing of Unicode letters
  3. * Copyright (c) 2002-2006 Sam Hocevar <sam@zoy.org>
  4. * All Rights Reserved
  5. *
  6. * $Id$
  7. *
  8. * This library is free software; you can redistribute it and/or
  9. * modify it under the terms of the Do What The Fuck You Want To
  10. * Public License, Version 2, as published by Sam Hocevar. See
  11. * http://sam.zoy.org/wtfpl/COPYING for more details.
  12. */
  13. /*
  14. * This file contains various import functions.
  15. */
  16. #include "config.h"
  17. #include "common.h"
  18. #if !defined(__KERNEL__)
  19. # if defined(HAVE_ERRNO_H)
  20. # include <errno.h>
  21. # endif
  22. # include <stdio.h>
  23. # include <stdlib.h>
  24. # include <string.h>
  25. #endif
  26. #include "cucul.h"
  27. #include "cucul_internals.h"
  28. /* ANSI Graphic Rendition Combination Mode */
  29. struct ansi_grcm
  30. {
  31. uint8_t fg, bg; /* ANSI-context fg/bg */
  32. uint8_t efg, ebg; /* Effective (libcucul) fg/bg */
  33. uint8_t bold, negative, concealed;
  34. };
  35. static cucul_canvas_t *import_caca(void const *, unsigned int);
  36. static cucul_canvas_t *import_text(void const *, unsigned int);
  37. static cucul_canvas_t *import_ansi(void const *, unsigned int, int);
  38. static void ansi_parse_grcm(cucul_canvas_t *, struct ansi_grcm *,
  39. unsigned int, unsigned int const *);
  40. /** \brief Import a buffer into a canvas
  41. *
  42. * Import a libcucul buffer as returned by cucul_load_memory()
  43. * or cucul_load_file() into an internal libcucul canvas.
  44. *
  45. * Valid values for \c format are:
  46. * - \c "": attempt to autodetect the file format.
  47. * - \c "text": import ASCII text files.
  48. * - \c "ansi": import ANSI files.
  49. * - \c "utf8": import UTF-8 files with ANSI colour codes.
  50. * - \c "caca": import native libcaca files.
  51. *
  52. * If an error occurs, NULL is returned and \b errno is set accordingly:
  53. * - \c ENOMEM Not enough memory to allocate canvas.
  54. * - \c EINVAL Invalid format requested.
  55. *
  56. * \param buffer A \e libcucul buffer containing the data to be loaded
  57. * into a canvas.
  58. * \param format A string describing the input format.
  59. * \return A libcucul canvas, or NULL in case of error.
  60. */
  61. cucul_canvas_t * cucul_import_canvas(cucul_buffer_t *buffer, char const *format)
  62. {
  63. char const *buf = (char const*)buffer->data;
  64. if(!strcasecmp("caca", format))
  65. return import_caca(buffer->data, buffer->size);
  66. if(!strcasecmp("utf8", format))
  67. return import_ansi(buffer->data, buffer->size, 1);
  68. if(!strcasecmp("text", format))
  69. return import_text(buffer->data, buffer->size);
  70. if(!strcasecmp("ansi", format))
  71. return import_ansi(buffer->data, buffer->size, 0);
  72. /* Autodetection */
  73. if(!strcasecmp("", format))
  74. {
  75. unsigned int i;
  76. /* If 4 first letters are CACA */
  77. if(buffer->size >= 4 &&
  78. buf[0] == 'C' && buf[1] == 'A' && buf[2] == 'C' && buf[3] != 'A')
  79. return import_caca(buffer->data, buffer->size);
  80. /* If we find ESC[ argv, we guess it's an ANSI file */
  81. for(i = 0; i + 1 < buffer->size; i++)
  82. if((buf[i] == 0x1b) && (buf[i + 1] == '['))
  83. return import_ansi(buffer->data, buffer->size, 0);
  84. /* Otherwise, import it as text */
  85. return import_text(buffer->data, buffer->size);
  86. }
  87. #if defined(HAVE_ERRNO_H)
  88. errno = EINVAL;
  89. #endif
  90. return NULL;
  91. }
  92. /** \brief Get available import formats
  93. *
  94. * Return a list of available import formats. The list is a NULL-terminated
  95. * array of strings, interleaving a string containing the internal value for
  96. * the import format, to be used with cucul_import_canvas(), and a string
  97. * containing the natural language description for that import format.
  98. *
  99. * This function never fails.
  100. *
  101. * \return An array of strings.
  102. */
  103. char const * const * cucul_get_import_list(void)
  104. {
  105. static char const * const list[] =
  106. {
  107. "", "autodetect",
  108. "text", "plain text",
  109. "caca", "native libcaca format",
  110. "ansi", "ANSI coloured text",
  111. NULL, NULL
  112. };
  113. return list;
  114. }
  115. /*
  116. * XXX: the following functions are local.
  117. */
  118. static cucul_canvas_t *import_caca(void const *data, unsigned int size)
  119. {
  120. cucul_canvas_t *cv;
  121. uint8_t const *buf = (uint8_t const *)data;
  122. unsigned int width, height, n;
  123. if(size < 16)
  124. goto invalid_caca;
  125. if(buf[0] != 'C' || buf[1] != 'A' || buf[2] != 'C' || buf[3] != 'A')
  126. goto invalid_caca;
  127. if(buf[4] != 'C' || buf[5] != 'A' || buf[6] != 'N' || buf[7] != 'V')
  128. goto invalid_caca;
  129. width = ((uint32_t)buf[8] << 24) | ((uint32_t)buf[9] << 16)
  130. | ((uint32_t)buf[10] << 8) | (uint32_t)buf[11];
  131. height = ((uint32_t)buf[12] << 24) | ((uint32_t)buf[13] << 16)
  132. | ((uint32_t)buf[14] << 8) | (uint32_t)buf[15];
  133. if(size != 16 + width * height * 8)
  134. goto invalid_caca;
  135. cv = cucul_create_canvas(width, height);
  136. if(!cv)
  137. {
  138. #if defined(HAVE_ERRNO_H)
  139. errno = ENOMEM;
  140. #endif
  141. return NULL;
  142. }
  143. for(n = height * width; n--; )
  144. {
  145. cv->chars[n] = ((uint32_t)buf[16 + 0 + 8 * n] << 24)
  146. | ((uint32_t)buf[16 + 1 + 8 * n] << 16)
  147. | ((uint32_t)buf[16 + 2 + 8 * n] << 8)
  148. | (uint32_t)buf[16 + 3 + 8 * n];
  149. cv->attr[n] = ((uint32_t)buf[16 + 4 + 8 * n] << 24)
  150. | ((uint32_t)buf[16 + 5 + 8 * n] << 16)
  151. | ((uint32_t)buf[16 + 6 + 8 * n] << 8)
  152. | (uint32_t)buf[16 + 7 + 8 * n];
  153. }
  154. return cv;
  155. invalid_caca:
  156. #if defined(HAVE_ERRNO_H)
  157. errno = EINVAL;
  158. #endif
  159. return NULL;
  160. }
  161. static cucul_canvas_t *import_text(void const *data, unsigned int size)
  162. {
  163. cucul_canvas_t *cv;
  164. char const *text = (char const *)data;
  165. unsigned int width = 0, height = 0, x = 0, y = 0, i;
  166. cv = cucul_create_canvas(width, height);
  167. if(!cv)
  168. {
  169. #if defined(HAVE_ERRNO_H)
  170. errno = ENOMEM;
  171. #endif
  172. return NULL;
  173. }
  174. cucul_set_color(cv, CUCUL_COLOR_DEFAULT, CUCUL_COLOR_TRANSPARENT);
  175. for(i = 0; i < size; i++)
  176. {
  177. unsigned char ch = *text++;
  178. if(ch == '\r')
  179. continue;
  180. if(ch == '\n')
  181. {
  182. x = 0;
  183. y++;
  184. continue;
  185. }
  186. if(x >= width || y >= height)
  187. {
  188. if(x >= width)
  189. width = x + 1;
  190. if(y >= height)
  191. height = y + 1;
  192. cucul_set_canvas_size(cv, width, height);
  193. }
  194. cucul_putchar(cv, x, y, ch);
  195. x++;
  196. }
  197. if(y > height)
  198. cucul_set_canvas_size(cv, width, height = y);
  199. return cv;
  200. }
  201. static cucul_canvas_t *import_ansi(void const *data, unsigned int size,
  202. int utf8)
  203. {
  204. struct ansi_grcm grcm;
  205. unsigned char const *buffer = (unsigned char const*)data;
  206. cucul_canvas_t *cv;
  207. unsigned int i, j, skip, dummy = 0;
  208. unsigned int width = 0, height = 0, wch = 1;
  209. unsigned long int ch;
  210. int x = 0, y = 0, save_x = 0, save_y = 0;
  211. cv = cucul_create_canvas(width, height);
  212. if(!cv)
  213. {
  214. #if defined(HAVE_ERRNO_H)
  215. errno = ENOMEM;
  216. #endif
  217. return NULL;
  218. }
  219. ansi_parse_grcm(cv, &grcm, 1, &dummy);
  220. for(i = 0; i < size; i += skip)
  221. {
  222. skip = 1;
  223. /* Wrap long lines */
  224. if((unsigned int)x >= 80)
  225. {
  226. x = 0;
  227. y++;
  228. }
  229. if(buffer[i] == '\x1a' && size - i >= 8
  230. && !memcmp(buffer + i + 1, "SAUCE00", 7))
  231. break; /* End before SAUCE data */
  232. if(buffer[i] == '\r')
  233. continue; /* DOS sucks */
  234. if(buffer[i] == '\n')
  235. {
  236. x = 0;
  237. y++;
  238. continue;
  239. }
  240. /* Interpret escape commands, as per Standard ECMA-48 "Control
  241. * Functions for Coded Character Sets", 5.4. Control sequences. */
  242. if(buffer[i] == '\x1b' && buffer[i + 1] == '[')
  243. {
  244. unsigned int argc = 0, argv[101];
  245. unsigned int param, inter, final;
  246. /* Compute offsets to parameter bytes, intermediate bytes and
  247. * to the final byte. Only the final byte is mandatory, there
  248. * can be zero of the others.
  249. * 0 param=2 inter final final+1
  250. * +-----+------------------+---------------------+-----------------+
  251. * | CSI | parameter bytes | intermediate bytes | final byte |
  252. * | | 0x30 - 0x3f | 0x20 - 0x2f | 0x40 - 0x7e |
  253. * | ^[[ | 0123456789:;<=>? | SPC !"#$%&'()*+,-./ | azAZ@[\]^_`{|}~ |
  254. * +-----+------------------+---------------------+-----------------+
  255. */
  256. param = 2;
  257. for(inter = param; i + inter < size; inter++)
  258. if(buffer[i + inter] < 0x30 || buffer[i + inter] > 0x3f)
  259. break;
  260. for(final = inter; i + final < size; final++)
  261. if(buffer[i + final] < 0x20 || buffer[i + final] > 0x2f)
  262. break;
  263. if(buffer[i + final] < 0x40 || buffer[i + final] > 0x7e)
  264. break; /* Invalid Final Byte */
  265. skip += final;
  266. /* Sanity checks */
  267. if(param < inter && buffer[i + param] >= 0x3c)
  268. {
  269. fprintf(stderr, "private sequence \"^[[%.*s\"\n",
  270. final - param + 1, buffer + i + param);
  271. continue; /* Private sequence, skip it entirely */
  272. }
  273. if(final - param > 100)
  274. continue; /* Suspiciously long sequence, skip it */
  275. /* Parse parameter bytes as per ECMA-48 5.4.2: Parameter string
  276. * format */
  277. if(param < inter)
  278. {
  279. argv[0] = 0;
  280. for(j = param; j < inter; j++)
  281. {
  282. if(buffer[i + j] == ';')
  283. argv[++argc] = 0;
  284. else if(buffer[i + j] >= '0' && buffer[i + j] <= '9')
  285. argv[argc] = 10 * argv[argc] + (buffer[i + j] - '0');
  286. }
  287. argc++;
  288. }
  289. /* Interpret final byte. The code representations are given in
  290. * ECMA-48 5.4: Control sequences, and the code definitions are
  291. * given in ECMA-48 8.3: Definition of control functions. */
  292. switch(buffer[i + final])
  293. {
  294. case 'f': /* CUP - Cursor Position */
  295. case 'H': /* HVP - Character And Line Position */
  296. x = (argc > 1 && argv[1] > 0) ? argv[1] - 1 : 0;
  297. y = (argc > 0 && argv[0] > 0) ? argv[0] - 1 : 0;
  298. break;
  299. case 'A': /* CUU - Cursor Up */
  300. y -= argc ? argv[0] : 1;
  301. if(y < 0)
  302. y = 0;
  303. break;
  304. case 'B': /* CUD - Cursor Down */
  305. y += argc ? argv[0] : 1;
  306. break;
  307. case 'C': /* CUF - Cursor Right */
  308. x += argc ? argv[0] : 1;
  309. break;
  310. case 'D': /* CUB - Cursor Left */
  311. x -= argc ? argv[0] : 1;
  312. if(x < 0)
  313. x = 0;
  314. break;
  315. case 's': /* Private (save cursor position) */
  316. save_x = x;
  317. save_y = y;
  318. break;
  319. case 'u': /* Private (reload cursor position) */
  320. x = save_x;
  321. y = save_y;
  322. break;
  323. case 'J': /* ED - Erase In Page */
  324. if(argv[0] == 2)
  325. x = y = 0;
  326. break;
  327. case 'K': /* EL - Erase In Line */
  328. if(width < 80)
  329. cucul_set_color(cv, CUCUL_COLOR_DEFAULT,
  330. CUCUL_COLOR_TRANSPARENT);
  331. cucul_set_canvas_size(cv, width = 80, height);
  332. for(j = x; j < 80; j++)
  333. cucul_putchar(cv, j, y, ' ');
  334. x = 80;
  335. break;
  336. case 'm': /* SGR - Select Graphic Rendition */
  337. ansi_parse_grcm(cv, &grcm, argc, argv);
  338. break;
  339. default:
  340. fprintf(stderr, "unknown command %c\n", buffer[i + final]);
  341. break;
  342. }
  343. continue;
  344. }
  345. /* Get the character we’re going to paste */
  346. if(utf8)
  347. {
  348. unsigned int bytes;
  349. ch = cucul_utf8_to_utf32((char const *)(buffer + i), &bytes);
  350. wch = cucul_utf32_is_fullwidth(ch) ? 2 : 1;
  351. skip += bytes - 1;
  352. }
  353. else
  354. {
  355. ch = cucul_cp437_to_utf32(buffer[i]);
  356. }
  357. /* Make sure the canvas is big enough. */
  358. if((unsigned int)x + wch > width)
  359. {
  360. cucul_set_color(cv, CUCUL_COLOR_DEFAULT, CUCUL_COLOR_TRANSPARENT);
  361. cucul_set_canvas_size(cv, width = x + wch, height);
  362. }
  363. if((unsigned int)y >= height)
  364. {
  365. cucul_set_color(cv, CUCUL_COLOR_DEFAULT, CUCUL_COLOR_TRANSPARENT);
  366. cucul_set_canvas_size(cv, width, height = y + 1);
  367. }
  368. /* Now paste our character */
  369. cucul_set_color(cv, grcm.efg, grcm.ebg);
  370. cucul_putchar(cv, x, y, ch);
  371. x += wch;
  372. }
  373. if((unsigned int)y > height)
  374. {
  375. cucul_set_color(cv, CUCUL_COLOR_DEFAULT, CUCUL_COLOR_TRANSPARENT);
  376. cucul_set_canvas_size(cv, width, height = y);
  377. }
  378. return cv;
  379. }
  380. /* XXX : ANSI loader helper */
  381. static void ansi_parse_grcm(cucul_canvas_t *cv, struct ansi_grcm *g,
  382. unsigned int argc, unsigned int const *argv)
  383. {
  384. static uint8_t const ansi2cucul[] =
  385. {
  386. CUCUL_COLOR_BLACK, CUCUL_COLOR_RED,
  387. CUCUL_COLOR_GREEN, CUCUL_COLOR_BROWN,
  388. CUCUL_COLOR_BLUE, CUCUL_COLOR_MAGENTA,
  389. CUCUL_COLOR_CYAN, CUCUL_COLOR_LIGHTGRAY
  390. };
  391. unsigned int j;
  392. for(j = 0; j < argc; j++)
  393. {
  394. /* Defined in ECMA-48 8.3.117: SGR - SELECT GRAPHIC RENDITION */
  395. if(argv[j] >= 30 && argv[j] <= 37)
  396. g->fg = ansi2cucul[argv[j] - 30];
  397. else if(argv[j] >= 40 && argv[j] <= 47)
  398. g->bg = ansi2cucul[argv[j] - 40];
  399. else if(argv[j] >= 90 && argv[j] <= 97)
  400. g->fg = ansi2cucul[argv[j] - 90] + 8;
  401. else if(argv[j] >= 100 && argv[j] <= 107)
  402. g->bg = ansi2cucul[argv[j] - 100] + 8;
  403. else switch(argv[j])
  404. {
  405. case 0: /* default rendition */
  406. g->fg = CUCUL_COLOR_DEFAULT;
  407. g->bg = CUCUL_COLOR_TRANSPARENT;
  408. g->bold = g->negative = g->concealed = 0;
  409. break;
  410. case 1: /* bold or increased intensity */
  411. g->bold = 1;
  412. break;
  413. case 4: /* singly underlined */
  414. break;
  415. case 5: /* slowly blinking (less then 150 per minute) */
  416. break;
  417. case 7: /* negative image */
  418. g->negative = 1;
  419. break;
  420. case 8: /* concealed characters */
  421. g->concealed = 1;
  422. break;
  423. case 22: /* normal colour or normal intensity (neither bold nor faint) */
  424. g->bold = 0;
  425. break;
  426. case 28: /* revealed characters */
  427. g->concealed = 0;
  428. break;
  429. case 39: /* default display colour (implementation-defined) */
  430. g->fg = CUCUL_COLOR_DEFAULT;
  431. break;
  432. case 49: /* default background colour (implementation-defined) */
  433. g->bg = CUCUL_COLOR_TRANSPARENT;
  434. break;
  435. default:
  436. fprintf(stderr, "unknown sgr %i\n", argv[j]);
  437. break;
  438. }
  439. }
  440. if(g->concealed)
  441. {
  442. g->efg = g->ebg = CUCUL_COLOR_TRANSPARENT;
  443. }
  444. else
  445. {
  446. g->efg = g->negative ? g->bg : g->fg;
  447. g->ebg = g->negative ? g->fg : g->bg;
  448. if(g->bold)
  449. {
  450. if(g->efg < 8)
  451. g->efg += 8;
  452. else if(g->efg == CUCUL_COLOR_DEFAULT)
  453. g->efg = CUCUL_COLOR_WHITE;
  454. }
  455. }
  456. }