@@ -226,6 +226,49 @@ Portions Copyright (c) 2017-2018, Chris Fraire <
[email protected] >.
226
226
<quiet >false</quiet >
227
227
</configuration >
228
228
</execution >
229
+ <execution >
230
+ <!-- Patches the JFlex-generated tokenizer sources so that the scanner buffer stops growing beyond the token size that Lucene accepts.
231
+ See https://github.com/OpenGrok/OpenGrok/issues/1170 : make parsers stop producing tokens > 32766 chars.
232
+ At least for PlainFullTokenizer, PlainSymbolTokenizer, JavaScriptSymbolTokenizer and JavaSymbolTokenizer,
233
+ apply the replacements configured below.
234
+ -->
235
+ <id >replace-in-jflex-sources</id >
236
+ <phase >generate-sources</phase >
237
+ <goals >
238
+ <goal >replace</goal >
239
+ </goals >
240
+ <configuration >
241
+ <filesToInclude >
242
+ ${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/java/JavaSymbolTokenizer.java,${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/javascript/JavaScriptSymbolTokenizer.java,${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/plain/PlainFullTokenizer.java,${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/plain/PlainSymbolTokenizer.java
243
+ </filesToInclude >
244
+ <replacements >
245
+ <replacement ><!-- drop "static final" from the ZZ_BUFFERSIZE declaration -->
246
+ <token >private static final int ZZ_BUFFERSIZE =</token >
247
+ <value >private int ZZ_BUFFERSIZE =</value >
248
+ </replacement >
249
+ <replacement ><!-- subtract zzFinalHighSurrogate from the requested read size -->
250
+ <token >int requested = zzBuffer\.length - zzEndRead;</token >
251
+ <value >int requested = zzBuffer.length - zzEndRead - zzFinalHighSurrogate;</value >
252
+ </replacement >
253
+ <replacement ><!-- after "zzFinalHighSurrogate = 1;" insert a branch that returns true when numRead == 1 -->
254
+ <token >(zzFinalHighSurrogate = 1;)(\r?\n)</token >
255
+ <value >$1$2 if (numRead == 1) { return true; }$2</value >
256
+ </replacement >
257
+ <replacement ><!-- delete the "is the buffer big enough?" block: the matched text is replaced by an empty value -->
258
+ <token >[ \t]*/\* is the buffer big enough\? \*/\s+if \(zzCurrentPos >= zzBuffer\.length.*?\}[ \t]*\r?\n</token >
259
+ <value ></value >
260
+ </replacement >
261
+ <!-- Also remove the "numRead == 0" (zero characters read) check that came in with 1.6.1; see https://github.com/jflex-de/jflex/blob/master/jflex/examples/zero-reader/README.md -->
262
+ <replacement >
263
+ <token >[ \t]*/\* not supposed to occur according to specification of java\.io\.Reader \*/\s+if \(numRead == 0.*?\}[ \t]*\r?\n</token >
264
+ <value ></value >
265
+ </replacement >
266
+ </replacements >
267
+ <regexFlags ><!-- DOTALL so that ".*?" in the tokens above can match across line breaks -->
268
+ <regexFlag >DOTALL</regexFlag >
269
+ </regexFlags >
270
+ </configuration >
271
+ </execution >
229
272
</executions >
230
273
</plugin >
231
274
<plugin >
@@ -271,60 +314,7 @@ Portions Copyright (c) 2017-2018, Chris Fraire <
[email protected] >.
271
314
</executions >
272
315
</plugin >
273
316
274
- <!-- patches jflex generated files to stop increasing buffer beyond token size that lucene accepts
275
- https://github.com/OpenGrok/OpenGrok/issues/1170 make parsers stop producing tokens > 32766 chars
276
- at least for PlainFullTokenizer, PlainSymbolTokenizer, JavaScriptSymbolTokenizer, JavaSymbolTokenizer
277
- use below
278
- -->
279
-
280
- <plugin >
281
- <groupId >com.google.code.maven-replacer-plugin</groupId >
282
- <artifactId >replacer</artifactId >
283
- <version >1.5.3</version >
284
- <executions >
285
- <execution >
286
- <id >replace-in-jflex-sources</id >
287
- <phase >generate-sources</phase >
288
- <goals >
289
- <goal >replace</goal >
290
- </goals >
291
- </execution >
292
- </executions >
293
- <configuration >
294
- <filesToInclude >
295
- ${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/java/JavaSymbolTokenizer.java,${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/javascript/JavaScriptSymbolTokenizer.java,${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/plain/PlainFullTokenizer.java,${basedir} /target/generated-sources/jflex/org/opengrok/indexer/analysis/plain/PlainSymbolTokenizer.java
296
- </filesToInclude >
297
- <replacements >
298
- <replacement >
299
- <token >private static final int ZZ_BUFFERSIZE =</token >
300
- <value >private int ZZ_BUFFERSIZE =</value >
301
- </replacement >
302
- <replacement >
303
- <token >int requested = zzBuffer\.length - zzEndRead;</token >
304
- <value >int requested = zzBuffer.length - zzEndRead - zzFinalHighSurrogate;</value >
305
- </replacement >
306
- <replacement >
307
- <token >(zzFinalHighSurrogate = 1;)(\r?\n)</token >
308
- <value >$1$2 if (numRead == 1) { return true; }$2</value >
309
- </replacement >
310
-
311
- <replacement >
312
- <token >[ \t]*/\* is the buffer big enough\? \*/\s+if \(zzCurrentPos >= zzBuffer\.length.*?\}[ \t]*\r?\n</token >
313
- <value ></value >
314
- </replacement >
315
- <!-- also revert 0 character check that got in with 1.6.1 : https://github.com/jflex-de/jflex/blob/master/jflex/examples/zero-reader/README.md -->
316
- <replacement >
317
- <token >[ \t]*/\* not supposed to occur according to specification of java\.io\.Reader \*/\s+if \(numRead == 0.*?\}[ \t]*\r?\n</token >
318
- <value ></value >
319
- </replacement >
320
- </replacements >
321
- <regexFlags >
322
- <regexFlag >DOTALL</regexFlag >
323
- </regexFlags >
324
- </configuration >
325
- </plugin >
326
-
327
- <plugin >
317
+ <plugin >
328
318
<groupId >org.apache.maven.plugins</groupId >
329
319
<artifactId >maven-antrun-plugin</artifactId >
330
320
<version >1.8</version >
0 commit comments