structuredtext.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373
  1. // Copyright (C) 2004-2025 Artifex Software, Inc.
  2. //
  3. // This file is part of MuPDF.
  4. //
  5. // MuPDF is free software: you can redistribute it and/or modify it under the
  6. // terms of the GNU Affero General Public License as published by the Free
  7. // Software Foundation, either version 3 of the License, or (at your option)
  8. // any later version.
  9. //
  10. // MuPDF is distributed in the hope that it will be useful, but WITHOUT ANY
  11. // WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
  12. // FOR A PARTICULAR PURPOSE. See the GNU Affero General Public License for more
  13. // details.
  14. //
  15. // You should have received a copy of the GNU Affero General Public License
  16. // along with MuPDF. If not, see <https://www.gnu.org/licenses/agpl-3.0.en.html>
  17. //
  18. // Alternative licensing terms are available from the licensor.
  19. // For commercial licensing, see <https://www.artifex.com/> or contact
  20. // Artifex Software, Inc., 39 Mesa Street, Suite 108A, San Francisco,
  21. // CA 94129, USA, for further information.
  22. /* StructuredText interface */
  23. JNIEXPORT void JNICALL
  24. FUN(StructuredText_finalize)(JNIEnv *env, jobject self)
  25. {
  26. fz_context *ctx = get_context(env);
  27. fz_stext_page *text = from_StructuredText_safe(env, self);
  28. if (!ctx || !text) return;
  29. (*env)->SetLongField(env, self, fid_StructuredText_pointer, 0);
  30. fz_drop_stext_page(ctx, text);
  31. }
  32. JNIEXPORT jobject JNICALL
  33. FUN(StructuredText_search)(JNIEnv *env, jobject self, jstring jneedle)
  34. {
  35. fz_context *ctx = get_context(env);
  36. fz_stext_page *text = from_StructuredText(env, self);
  37. const char *needle = NULL;
  38. search_state state = { env, NULL, 0 };
  39. if (!ctx || !text) return NULL;
  40. if (!jneedle) jni_throw_arg(env, "needle must not be null");
  41. needle = (*env)->GetStringUTFChars(env, jneedle, NULL);
  42. if (!needle) return NULL;
  43. state.hits = (*env)->NewObject(env, cls_ArrayList, mid_ArrayList_init);
  44. if (!state.hits || (*env)->ExceptionCheck(env)) return NULL;
  45. fz_try(ctx)
  46. fz_search_stext_page_cb(ctx, text, needle, hit_callback, &state);
  47. fz_always(ctx)
  48. (*env)->ReleaseStringUTFChars(env, jneedle, needle);
  49. fz_catch(ctx)
  50. jni_rethrow(env, ctx);
  51. if (state.error)
  52. return NULL;
  53. return (*env)->CallObjectMethod(env, state.hits, mid_ArrayList_toArray);
  54. }
  55. JNIEXPORT jobject JNICALL
  56. FUN(StructuredText_highlight)(JNIEnv *env, jobject self, jobject jpt1, jobject jpt2)
  57. {
  58. fz_context *ctx = get_context(env);
  59. fz_stext_page *text = from_StructuredText(env, self);
  60. fz_point pt1 = from_Point(env, jpt1);
  61. fz_point pt2 = from_Point(env, jpt2);
  62. fz_quad hits[1000];
  63. int n = 0;
  64. if (!ctx || !text) return NULL;
  65. fz_try(ctx)
  66. n = fz_highlight_selection(ctx, text, pt1, pt2, hits, nelem(hits));
  67. fz_catch(ctx)
  68. jni_rethrow(env, ctx);
  69. return to_QuadArray_safe(ctx, env, hits, n);
  70. }
  71. JNIEXPORT jobject JNICALL
  72. FUN(StructuredText_snapSelection)(JNIEnv *env, jobject self, jobject jpt1, jobject jpt2, jint mode)
  73. {
  74. fz_context *ctx = get_context(env);
  75. fz_stext_page *text = from_StructuredText(env, self);
  76. fz_point pt1 = from_Point(env, jpt1);
  77. fz_point pt2 = from_Point(env, jpt2);
  78. fz_quad quad;
  79. if (!ctx || !text) return NULL;
  80. fz_try(ctx)
  81. quad = fz_snap_selection(ctx, text, &pt1, &pt2, mode);
  82. fz_catch(ctx)
  83. jni_rethrow(env, ctx);
  84. (*env)->SetFloatField(env, jpt1, fid_Point_x, pt1.x);
  85. (*env)->SetFloatField(env, jpt1, fid_Point_y, pt1.y);
  86. (*env)->SetFloatField(env, jpt2, fid_Point_x, pt2.x);
  87. (*env)->SetFloatField(env, jpt2, fid_Point_y, pt2.y);
  88. return to_Quad_safe(ctx, env, quad);
  89. }
  90. JNIEXPORT jobject JNICALL
  91. FUN(StructuredText_copy)(JNIEnv *env, jobject self, jobject jpt1, jobject jpt2)
  92. {
  93. fz_context *ctx = get_context(env);
  94. fz_stext_page *text = from_StructuredText(env, self);
  95. fz_point pt1 = from_Point(env, jpt1);
  96. fz_point pt2 = from_Point(env, jpt2);
  97. jstring jstring = NULL;
  98. char *s = NULL;
  99. if (!ctx || !text) return NULL;
  100. fz_var(s);
  101. fz_try(ctx)
  102. {
  103. s = fz_copy_selection(ctx, text, pt1, pt2, 0);
  104. jstring = (*env)->NewStringUTF(env, s);
  105. }
  106. fz_always(ctx)
  107. fz_free(ctx, s);
  108. fz_catch(ctx)
  109. jni_rethrow(env, ctx);
  110. return jstring;
  111. }
  112. static void
  113. java_stext_walk(JNIEnv *env, fz_context *ctx, jobject walker, fz_stext_block *block)
  114. {
  115. fz_stext_line *line = NULL;
  116. fz_stext_char *ch = NULL;
  117. jobject jbbox = NULL;
  118. jobject jtrm = NULL;
  119. jobject jimage = NULL;
  120. jobject jdir = NULL;
  121. jobject jorigin = NULL;
  122. jobject jfont = NULL;
  123. jobject jquad = NULL;
  124. jobject jvecinfo = NULL;
  125. if (block == NULL)
  126. return; /* structured text has no blocks to walk */
  127. for (; block; block = block->next)
  128. {
  129. if (block->type == FZ_STEXT_BLOCK_IMAGE)
  130. {
  131. jbbox = to_Rect_safe(ctx, env, block->bbox);
  132. if (!jbbox) return;
  133. jtrm = to_Matrix_safe(ctx, env, block->u.i.transform);
  134. if (!jtrm) return;
  135. jimage = to_Image_safe(ctx, env, block->u.i.image);
  136. if (!jimage) return;
  137. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_onImageBlock, jbbox, jtrm, jimage);
  138. if ((*env)->ExceptionCheck(env)) return;
  139. (*env)->DeleteLocalRef(env, jbbox);
  140. (*env)->DeleteLocalRef(env, jimage);
  141. (*env)->DeleteLocalRef(env, jtrm);
  142. }
  143. else if (block->type == FZ_STEXT_BLOCK_TEXT)
  144. {
  145. jbbox = to_Rect_safe(ctx, env, block->bbox);
  146. if (!jbbox) return;
  147. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_beginTextBlock, jbbox);
  148. if ((*env)->ExceptionCheck(env)) return;
  149. (*env)->DeleteLocalRef(env, jbbox);
  150. for (line = block->u.t.first_line; line; line = line->next)
  151. {
  152. jbbox = to_Rect_safe(ctx, env, line->bbox);
  153. if (!jbbox) return;
  154. jdir = to_Point_safe(ctx, env, line->dir);
  155. if (!jdir) return;
  156. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_beginLine, jbbox, line->wmode, jdir);
  157. if ((*env)->ExceptionCheck(env)) return;
  158. (*env)->DeleteLocalRef(env, jdir);
  159. (*env)->DeleteLocalRef(env, jbbox);
  160. for (ch = line->first_char; ch; ch = ch->next)
  161. {
  162. jorigin = to_Point_safe(ctx, env, ch->origin);
  163. if (!jorigin) return;
  164. jfont = to_Font_safe(ctx, env, ch->font);
  165. if (!jfont) return;
  166. jquad = to_Quad_safe(ctx, env, ch->quad);
  167. if (!jquad) return;
  168. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_onChar,
  169. ch->c, jorigin, jfont, ch->size, jquad);
  170. if ((*env)->ExceptionCheck(env)) return;
  171. (*env)->DeleteLocalRef(env, jquad);
  172. (*env)->DeleteLocalRef(env, jfont);
  173. (*env)->DeleteLocalRef(env, jorigin);
  174. }
  175. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_endLine);
  176. if ((*env)->ExceptionCheck(env)) return;
  177. }
  178. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_endTextBlock);
  179. if ((*env)->ExceptionCheck(env)) return;
  180. }
  181. else if (block->type == FZ_STEXT_BLOCK_STRUCT)
  182. {
  183. jstring jstandard = to_String_safe(ctx, env, fz_structure_to_string(block->u.s.down->standard));
  184. if (!jstandard) return;
  185. jstring jraw = to_String_safe(ctx, env, block->u.s.down->raw);
  186. if (!jraw) return;
  187. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_beginStruct, jstandard, jraw, block->u.s.index);
  188. if ((*env)->ExceptionCheck(env)) return;
  189. (*env)->DeleteLocalRef(env, jraw);
  190. (*env)->DeleteLocalRef(env, jstandard);
  191. if (block->u.s.down)
  192. java_stext_walk(env, ctx, walker, block->u.s.down->first_block);
  193. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_endStruct);
  194. if ((*env)->ExceptionCheck(env)) return;
  195. }
  196. else if (block->type == FZ_STEXT_BLOCK_VECTOR)
  197. {
  198. jbbox = to_Rect_safe(ctx, env, block->bbox);
  199. if (!jbbox) return;
  200. jvecinfo = to_VectorInfo_safe(ctx, env, block->u.v.flags);
  201. if (!jvecinfo) return;
  202. (*env)->CallVoidMethod(env, walker, mid_StructuredTextWalker_onVector, jbbox, jvecinfo, block->u.v.argb);
  203. if ((*env)->ExceptionCheck(env)) return;
  204. (*env)->DeleteLocalRef(env, jvecinfo);
  205. (*env)->DeleteLocalRef(env, jbbox);
  206. }
  207. }
  208. }
  209. JNIEXPORT void JNICALL
  210. FUN(StructuredText_walk)(JNIEnv *env, jobject self, jobject walker)
  211. {
  212. fz_context *ctx = get_context(env);
  213. fz_stext_page *page = from_StructuredText(env, self);
  214. if (!ctx || !page) return;
  215. if (!walker) jni_throw_arg_void(env, "walker must not be null");
  216. java_stext_walk(env, ctx, walker, page->first_block);
  217. }
  218. JNIEXPORT jstring JNICALL
  219. FUN(StructuredText_asJSON)(JNIEnv *env, jobject self, jfloat scale)
  220. {
  221. fz_context *ctx = get_context(env);
  222. fz_stext_page *page = from_StructuredText(env, self);
  223. fz_output *out = NULL;
  224. fz_buffer *buf = NULL;
  225. char *str = NULL;
  226. if (!ctx || !page) return NULL;
  227. fz_var(buf);
  228. fz_var(out);
  229. fz_try(ctx)
  230. {
  231. buf = fz_new_buffer(ctx, 1024);
  232. out = fz_new_output_with_buffer(ctx, buf);
  233. fz_print_stext_page_as_json(ctx, out, page, scale);
  234. fz_close_output(ctx, out);
  235. fz_terminate_buffer(ctx, buf);
  236. (void)fz_buffer_extract(ctx, buf, (unsigned char**)&str);
  237. }
  238. fz_always(ctx)
  239. fz_drop_output(ctx, out);
  240. fz_catch(ctx)
  241. {
  242. fz_drop_buffer(ctx, buf);
  243. jni_rethrow(env, ctx);
  244. }
  245. return to_String_safe_own(ctx, env, str);
  246. }
  247. JNIEXPORT jstring JNICALL
  248. FUN(StructuredText_asHTML)(JNIEnv *env, jobject self, jint id)
  249. {
  250. fz_context *ctx = get_context(env);
  251. fz_stext_page *page = from_StructuredText(env, self);
  252. fz_output *out = NULL;
  253. fz_buffer *buf = NULL;
  254. char *str = NULL;
  255. if (!ctx || !page) return NULL;
  256. fz_var(buf);
  257. fz_var(out);
  258. fz_try(ctx)
  259. {
  260. buf = fz_new_buffer(ctx, 1024);
  261. out = fz_new_output_with_buffer(ctx, buf);
  262. fz_print_stext_page_as_html(ctx, out, page, id);
  263. fz_close_output(ctx, out);
  264. fz_terminate_buffer(ctx, buf);
  265. (void)fz_buffer_extract(ctx, buf, (unsigned char**)&str);
  266. }
  267. fz_always(ctx)
  268. fz_drop_output(ctx, out);
  269. fz_catch(ctx)
  270. {
  271. fz_drop_buffer(ctx, buf);
  272. jni_rethrow(env, ctx);
  273. }
  274. return to_String_safe_own(ctx, env, str);
  275. }
  276. JNIEXPORT jstring JNICALL
  277. FUN(StructuredText_asText)(JNIEnv *env, jobject self)
  278. {
  279. fz_context *ctx = get_context(env);
  280. fz_stext_page *page = from_StructuredText(env, self);
  281. fz_output *out = NULL;
  282. fz_buffer *buf = NULL;
  283. char *str = NULL;
  284. if (!ctx || !page) return NULL;
  285. fz_var(buf);
  286. fz_var(out);
  287. fz_try(ctx)
  288. {
  289. buf = fz_new_buffer(ctx, 1024);
  290. out = fz_new_output_with_buffer(ctx, buf);
  291. fz_print_stext_page_as_text(ctx, out, page);
  292. fz_close_output(ctx, out);
  293. fz_terminate_buffer(ctx, buf);
  294. (void)fz_buffer_extract(ctx, buf, (unsigned char**)&str);
  295. }
  296. fz_always(ctx)
  297. fz_drop_output(ctx, out);
  298. fz_catch(ctx)
  299. {
  300. fz_drop_buffer(ctx, buf);
  301. jni_rethrow(env, ctx);
  302. }
  303. return to_String_safe_own(ctx, env, str);
  304. }