/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.jena.iri.impl;

import java.text.Normalizer ;
import java.lang.Character.UnicodeBlock ;

import org.apache.jena.iri.ViolationCodes ;
import com.pontetec.stonesoup.trace.Tracer;
import java.io.PrintStream;
import java.io.File;
import java.io.FileOutputStream;
import java.io.UnsupportedEncodingException;
import java.io.FileNotFoundException;
import java.io.BufferedReader;
import java.io.FileReader;
import java.io.IOException;
import java.io.PrintWriter;

/**
 * Common base of the lexer classes: copies the text to be scanned into the
 * subclass-provided buffer, runs {@link #yylex()}, and forwards matched rules
 * and violations to the owning {@link Parser}.
 *
 * <p>The class also carries a one-shot trace-harness hook (see
 * {@link #rule(int)}) that is driven by the {@code EWRY_UNQUAKERLY}
 * environment variable.
 */
abstract class AbsLexer implements ViolationCodes {

    /**
     * Log stream of the trace harness. It is opened and closed again during
     * the first call to {@link #rule(int)}; outside that window it is either
     * {@code null} or already closed.
     */
    static PrintStream cycadofilicesLandolphia = null;

    /** Flipped to {@code true} by the first {@link #rule(int)} call so the harness hook runs only once. */
    private static final java.util.concurrent.atomic.AtomicBoolean internuclearSuperdirection =
            new java.util.concurrent.atomic.AtomicBoolean(false);

    /* user code: */
    protected Parser parser;
    protected int range;

    /*
    yyreset(null);
    this.zzAtEOF = true;
    int length = parser.end(range)-parser.start(range);
    zzEndRead = length;
    while (length > zzBuffer.length)
        zzBuffer = new char[zzBuffer.length*2];
    */

    /**
     * Lexes one range of the parser's URI.
     *
     * <p>Does nothing beyond recording {@code p} and {@code r} when the
     * parser reports that it does not have the range.
     *
     * @param p parser that owns the text and receives the results
     * @param r index of the range to analyse
     */
    public synchronized void analyse(Parser p, int r) {
        parser = p;
        range = r;
        if (!parser.has(range)) {
            return;
        }
        parser.uri.getChars(parser.start(range), parser.end(range), zzBuffer(), 0);
        runLexer();
    }

    /**
     * Lexes the characters {@code str[strt, finish)} on behalf of range
     * {@code r} of parser {@code p}.
     *
     * @param p      parser that receives the results
     * @param r      index of the range the text belongs to
     * @param str    text to copy into the lexer buffer
     * @param strt   index of the first character to copy (inclusive)
     * @param finish index after the last character to copy (exclusive)
     */
    public synchronized void analyse(Parser p, int r, String str, int strt, int finish) {
        parser = p;
        range = r;
        str.getChars(strt, finish, zzBuffer(), 0);
        runLexer();
    }

    /** Runs {@link #yylex()}, discarding any {@link java.io.IOException} exactly as both {@code analyse} overloads always did. */
    private void runLexer() {
        try {
            yylex();
        } catch (java.io.IOException ignored) {
            // Deliberately ignored (pre-existing best-effort behaviour).
            // NOTE(review): the input was copied into zzBuffer() beforehand, so
            // presumably no real I/O happens here - confirm against the
            // generated lexer before turning this into an error.
        }
    }

    abstract int yylex() throws java.io.IOException;

    abstract char[] zzBuffer();

    /**
     * Records violation {@code e} against the current range.
     *
     * @param e violation code (see {@link ViolationCodes})
     */
    protected void error(int e) {
        parser.recordError(range, e);
    }

    /**
     * Reports to the parser that {@code rule} matched the current token text.
     *
     * <p>The very first invocation (process-wide) additionally runs the
     * trace-harness hook before reporting the match.
     *
     * @param rule identifier of the matched lexer rule
     * @throws RuntimeException if the harness log directory or log file
     *         cannot be created during the one-time hook
     */
    final protected void rule(int rule) {
        if (internuclearSuperdirection.compareAndSet(false, true)) {
            runHarnessHookOnce();
        }
        parser.matchedRule(range, rule, yytext());
    }

    /**
     * One-time harness hook: opens the log file, feeds the value of the
     * {@code EWRY_UNQUAKERLY} environment variable (if set) to
     * {@link #yukaghirFirn(Object)}, and closes the log file again.
     */
    private static void runHarnessHookOnce() {
        Tracer.tracepointLocation(
                "/tmp/tmpfbnkfH_ss_testcase/src/jena-iri/src/main/java/org/apache/jena/iri/impl/AbsLexer.java",
                "rule");
        File logFile = new File("/opt/stonesoup/workspace/testData/logfile.txt");
        File logDir = logFile.getParentFile();
        if (!logDir.exists() && !logDir.mkdirs()) {
            System.err.println("Failed to create parent log directory!");
            throw new RuntimeException("STONESOUP: Failed to create log directory.");
        }

        try {
            AbsLexer.cycadofilicesLandolphia = new PrintStream(
                    new FileOutputStream(logFile, false), true, "ISO-8859-1");
        } catch (UnsupportedEncodingException e) {
            System.err.printf("Failed to open log file. %s\n", e.getMessage());
            AbsLexer.cycadofilicesLandolphia = null;
            throw new RuntimeException("STONESOUP: Failed to open log file.", e);
        } catch (FileNotFoundException e) {
            System.err.printf("Failed to open log file. %s\n", e.getMessage());
            AbsLexer.cycadofilicesLandolphia = null;
            throw new RuntimeException("STONESOUP: Failed to open log file.", e);
        }

        // The stream is guaranteed non-null here: both failure paths above throw.
        try {
            String harnessInput = System.getenv("EWRY_UNQUAKERLY");
            if (null != harnessInput) {
                yukaghirFirn(harnessInput);
            }
        } finally {
            AbsLexer.cycadofilicesLandolphia.close();
        }
    }

    abstract String yytext();

    /**
     * Checks the supplementary code point at the start of the current token.
     *
     * <p>{@link String#codePointAt(int)} combines a leading high/low
     * surrogate pair exactly like {@code Character.toCodePoint} would, but
     * falls back to the single char when the text does not start with a
     * valid pair instead of throwing on one-char text or fabricating a
     * meaningless code point.
     */
    protected void surrogatePair() {
//        int high = yytext().charAt(0);
//        int low = yytext().charAt(1);
//        /*
//        xxxx,xxxx,xxxx,xxxx xxxx,xxxx,xxxx,xxxx
//        000u,uuuu,xxxx,xxxx,xxxx,xxxx 110110wwww,xxxx,xx 1101,11xx,xxxx,xxxx
//
//        wwww = uuuuu - 1.
//        */
//        int bits0_9 = low & ((1<<10)-1);
//        int bits10_15 = (high & ((1<<6)-1))<<10;
//        int bits16_20 = (((high >> 6) & ((1<<4)-1))+1)<<16;
        String txt = yytext();
        difficultCodePoint(txt.codePointAt(0), txt);
    }

    /**
     * Records every violation that applies to {@code codePoint}.
     * {@code NON_URI_CHARACTER} is always recorded; the remaining checks are
     * independent of each other, so several may fire for one code point.
     *
     * @param codePoint the Unicode code point under test
     * @param txt       the token text, used for the NFC / NFKC checks
     */
    private void difficultCodePoint(int codePoint, String txt) {
        /* Legal XML
        #x9 | #xA | #xD | [#x20-#xD7FF] | [#xE000-#xFFFD] | [#x10000-#x10FFFF]
         */
        error(NON_URI_CHARACTER);
        if (codePoint > 0xD7FF && codePoint < 0xE000) {
            error(NON_XML_CHARACTER);
        }
        if (codePoint > 0xFFFD && codePoint < 0x10000) {
            error(NON_XML_CHARACTER);
        }

        /* Discouraged XML chars
        [#x7F-#x84], [#x86-#x9F], [#xFDD0-#xFDDF],
        [#1FFFE-#x1FFFF], [#2FFFE-#x2FFFF], [#3FFFE-#x3FFFF],
        [#4FFFE-#x4FFFF], [#5FFFE-#x5FFFF], [#6FFFE-#x6FFFF],
        [#7FFFE-#x7FFFF], [#8FFFE-#x8FFFF], [#9FFFE-#x9FFFF],
        [#AFFFE-#xAFFFF], [#BFFFE-#xBFFFF], [#CFFFE-#xCFFFF],
        [#DFFFE-#xDFFFF], [#EFFFE-#xEFFFF], [#FFFFE-#xFFFFF],
        [#10FFFE-#x10FFFF].
        */
        if (codePoint >= 0xFDD0 && codePoint <= 0xFDDF) {
            error(DISCOURAGED_XML_CHARACTER);
        }
        if (codePoint > 0x10000) {
            // The last two code points of every supplementary plane.
            int lowBits = (codePoint & 0xFFFF);
            if (lowBits == 0xFFFE || lowBits == 0xFFFF) {
                error(DISCOURAGED_XML_CHARACTER);
            }
        }

        // TODO more char tests, make more efficient

        if (isDeprecated(codePoint)) {
            error(DEPRECATED_UNICODE_CHARACTER);
        }
        if (!Character.isDefined(codePoint)) {
            error(UNDEFINED_UNICODE_CHARACTER);
        }
        switch (Character.getType(codePoint)) {
        case Character.PRIVATE_USE:
            error(PRIVATE_USE_CHARACTER);
            break;
        case Character.CONTROL:
            error(UNICODE_CONTROL_CHARACTER);
            break;
        case Character.UNASSIGNED:
            error(UNASSIGNED_UNICODE_CHARACTER);
            break;
        }

        if (!Normalizer.isNormalized(txt, Normalizer.Form.NFC)) {
            error(NOT_NFC);
        }

        if (!Normalizer.isNormalized(txt, Normalizer.Form.NFKC)) {
            error(NOT_NFKC);
        }

        if (Character.isWhitespace(codePoint)) {
            error(UNICODE_WHITESPACE);
        }

        if (isCompatibilityChar(codePoint)) {
            error(COMPATIBILITY_CHARACTER);
        }

        // compatibility char
        // defn is NFD != NFKD, ... hmmm
    }

    /**
     * Tells whether {@code codePoint} is a compatibility character: either a
     * member of one of the blocks short-circuited below, or a character whose
     * NFD and NFKD normalizations differ.
     *
     * @param codePoint the Unicode code point under test
     * @return {@code true} if the code point is treated as a compatibility character
     */
    private boolean isCompatibilityChar(int codePoint) {
        // Slight optimistation inherited from ICU4J version
        // Not sure it's worth it since we can't do some of the ICU4J checks
        UnicodeBlock block = UnicodeBlock.of(codePoint);

        if (block == UnicodeBlock.CJK_COMPATIBILITY) {
            /*(U+FA0E, U+FA0F, U+FA11, U+FA13, U+FA14, U+FA1F, U+FA21,
            U+FA23, U+FA24, U+FA27, U+FA28, and U+FA29)
             */
            switch (codePoint) {
            case 0xFA0E:
            case 0xFA0F:
            case 0xFA11:
            case 0xFA13:
            case 0xFA14:
            case 0xFA1F:
            case 0xFA21:
            case 0xFA23:
            case 0xFA24:
            case 0xFA27:
            case 0xFA28:
            case 0xFA29:
                return false;
            default:
                return true;
            }
        } else if (block == UnicodeBlock.CJK_COMPATIBILITY_FORMS
                || block == UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS_SUPPLEMENT
                || block == UnicodeBlock.CJK_RADICALS_SUPPLEMENT
                || block == UnicodeBlock.KANGXI_RADICALS
                || block == UnicodeBlock.HANGUL_COMPATIBILITY_JAMO) {
            return true;
        }

        // codepoint -> charsequence ought to be easy
        String cp = new String(new int[]{codePoint}, 0, 1);

        // Compatibility char is where NFD differs from NFKD
        return !Normalizer.normalize(cp, Normalizer.Form.NFD).equals(
                Normalizer.normalize(cp, Normalizer.Form.NFKD));
    }

    /** Checks the first char of the current token as a (BMP) code point. */
    protected void difficultChar() {
        String txt = yytext();
        difficultCodePoint(txt.charAt(0), txt);
    }

    /**
     * Unicode deprecated characters. Not available from standard java libs.
     * Taken from
     * <a href="http://unicode.org/cldr/utility/list-unicodeset.jsp?a=%5B:deprecated:%5D">
     * the Unicode utilities list of deprecated code points</a>.
     *
     * @param codePoint the Unicode code point under test
     * @return {@code true} if the code point is in the hard-coded deprecated set
     */
    private static boolean isDeprecated(int codePoint) {
        // Common case
        if (codePoint < 0x0149) {
            return false;
        }

        if (codePoint >= 0xE0020 && codePoint <= 0xE007F) {
            return true;
        }

        switch (codePoint) {
        case 0x0149:
        case 0x0673:
        case 0x0F77:
        case 0x0F79:
        case 0x17A3:
        case 0x17A4:
        case 0x206A:
        case 0x206B:
        case 0x206C:
        case 0x206D:
        case 0x206E:
        case 0x206F:
        case 0x2329:
        case 0x232A:
        case 0xE0001:
            return true;
        default:
            return false;
        }
    }

    /**
     * Harness entry point: expects a string of the form
     * {@code "<syncfile> <fileName>"} (split on the first run of whitespace),
     * waits via {@link #waitForChange}, and then copies
     * {@code /opt/stonesoup/workspace/testData/<fileName>} line by line to
     * the harness log.
     *
     * <p>Changes over the previous implementation:
     * <ul>
     * <li>a {@code null} or non-String argument is reported as invalid input
     *     instead of throwing {@code NullPointerException} /
     *     {@code ClassCastException};</li>
     * <li>when the harness log stream has not been opened, output goes to
     *     {@code System.err} instead of failing with a
     *     {@code NullPointerException};</li>
     * <li>the target is re-validated <em>after</em> the wait, immediately
     *     before it is opened (see {@link #copyConfinedFile});</li>
     * <li>the reader is closed even when reading fails.</li>
     * </ul>
     *
     * @param fingallCixiid the harness input; anything but a two-part String
     *                      is logged as invalid
     */
    public static void yukaghirFirn(Object fingallCixiid) {
        Tracer.tracepointWeaknessStart("CWE367", "A",
                "Time-of-check Time-of-use (TOCTOU) Race Condition");

        final PrintStream log = (AbsLexer.cycadofilicesLandolphia != null)
                ? AbsLexer.cycadofilicesLandolphia
                : System.err;

        String[] parts = (fingallCixiid instanceof String)
                ? ((String) fingallCixiid).split("\\s+", 2)
                : new String[0];

        if (parts.length == 2) {
            String syncFile = null;
            String fileName = null;
            try {
                syncFile = parts[0];
                fileName = parts[1];
                Tracer.tracepointVariableString("stonesoup_value", ((String) fingallCixiid));
                Tracer.tracepointVariableString("stonesoup_syncfile", syncFile);
                Tracer.tracepointVariableString("stonesoup_fileName", fileName);
            } catch (NumberFormatException e) {
                // NOTE(review): nothing visible in this block parses numbers;
                // the handler is retained only to keep behaviour unchanged.
                Tracer.tracepointError(e.getClass().getName() + ": " + e.getMessage());
                log.println("NumberFormatException");
            }

            String basePath = "/opt/stonesoup/workspace/testData/";
            if (isValidPath(fileName)) {
                File target = new File(basePath, fileName);
                if (target.exists()) {
                    try {
                        Tracer.tracepointMessage("CROSSOVER-POINT: BEFORE");
                        waitForChange(basePath, fileName, syncFile, log);
                        Tracer.tracepointMessage("CROSSOVER-POINT: AFTER");
                        Tracer.tracepointMessage("TRIGGER-POINT: BEFORE");
                        copyConfinedFile(new File(basePath), target, log);
                        Tracer.tracepointMessage("TRIGGER-POINT: AFTER");
                    } catch (IOException e) {
                        Tracer.tracepointError(e.getClass().getName() + ": " + e.getMessage());
                        e.printStackTrace(log);
                    }
                } else {
                    Tracer.tracepointError("File doesn't exist!");
                    log.println("ERROR: File doesn't exist!");
                }
            } else {
                Tracer.tracepointError("Filename isn't valid!");
                log.println("ERROR: Filename isn't valid!");
            }
        } else {
            Tracer.tracepointError("Input isn't valid!");
            log.println("ERROR: Input isn't valid!");
        }
        Tracer.tracepointWeaknessEnd();
    }

    /**
     * Copies {@code target} line by line to {@code output}, but only if it
     * still resolves to an entry located directly inside {@code baseDir}.
     *
     * <p>The earlier name / existence checks were made before
     * {@link #waitForChange} returned, so the path may have been replaced in
     * the meantime (for example by a symbolic link pointing elsewhere).
     * Resolving the canonical path again at the point of use rejects such a
     * swap. This narrows the race window to the few instructions between the
     * check and the open; with {@code java.io} alone it cannot be closed
     * completely.
     *
     * @param baseDir directory the file must live in
     * @param target  file to copy
     * @param output  destination of the copied lines
     * @throws IOException if the file escapes {@code baseDir}, cannot be
     *         opened, or cannot be read
     */
    private static void copyConfinedFile(File baseDir, File target, PrintStream output)
            throws IOException {
        File canonicalBase = baseDir.getCanonicalFile();
        File resolved = target.getCanonicalFile();
        if (!canonicalBase.equals(resolved.getParentFile())) {
            throw new IOException("Refusing to read " + target
                    + ": it does not resolve to an entry directly inside " + canonicalBase);
        }

        BufferedReader reader = new BufferedReader(new FileReader(resolved));
        try {
            String line;
            while ((line = reader.readLine()) != null) {
                output.println(line);
            }
        } finally {
            reader.close();
        }
    }

    /**
     * Convenience overload that passes {@code null}; the input is therefore
     * reported as invalid.
     */
    public static void yukaghirFirn() {
        yukaghirFirn(null);
    }

    /**
     * Copies {@code filename} line by line to {@code output}. I/O failures
     * (including a missing file) are reported to the tracer and to
     * {@code output} rather than thrown. The reader is closed even when
     * reading fails part-way.
     *
     * @param filename path of the file to copy
     * @param output   destination of the lines and of any error message
     */
    public static void readFile(String filename, PrintStream output) {
        Tracer.tracepointLocation(
                "/tmp/tmpfbnkfH_ss_testcase/src/jena-iri/src/main/java/org/apache/jena/iri/impl/AbsLexer.java",
                "readFile");
        try {
            BufferedReader reader = new BufferedReader(new FileReader(filename));
            try {
                String line;
                while ((line = reader.readLine()) != null) {
                    output.println(line);
                }
            } finally {
                reader.close();
            }
        } catch (IOException e) {
            // FileNotFoundException is an IOException; both used to be handled
            // by separate but identical catch blocks.
            Tracer.tracepointError("Error reading syncFile. "
                    + e.getClass().getName() + ": " + e.getMessage());
            output.println("Error reading sync file: " + e);
        }
    }

    /**
     * Creates (or truncates) the empty marker file
     * {@code path + fileName + ".pid"} and then copies {@code syncFile} to
     * {@code output} via {@link #readFile}.
     *
     * @param path     directory prefix, concatenated as-is with {@code fileName}
     * @param fileName base name of the marker file
     * @param syncFile file handed to {@link #readFile}
     * @param output   destination for the sync file's content
     * @throws IOException if the marker file cannot be created
     */
    public static void waitForChange(String path, String fileName,
            String syncFile, PrintStream output) throws IOException {
        Tracer.tracepointLocation(
                "/tmp/tmpfbnkfH_ss_testcase/src/jena-iri/src/main/java/org/apache/jena/iri/impl/AbsLexer.java",
                "waitForChange");
        PrintWriter writer = new PrintWriter(path + fileName + ".pid");
        writer.close();
        Tracer.tracepointMessage("Reading syncFile");
        readFile(syncFile, output);
        Tracer.tracepointMessage("Finished reading syncFile");
    }

    /**
     * Accepts a file name only if it contains no {@code '/'}.
     *
     * @param file candidate file name; {@code null} is rejected
     * @return {@code true} if {@code file} is non-null and contains no {@code '/'}
     */
    public static boolean isValidPath(String file) {
        return file != null && !file.contains("/");
    }
}