Dave Jarvis' Repositories - keenquotes

M src/main/java/com/whitemagicsoftware/keenquotes/lex/Lexeme.java

   /**
    * Creates a new instance with a copy of {@link LexemeType} to prevent
    * subsequent mutations from affecting the resolution of ambiguous quotes.
    * Only the type is duplicated (through its own {@code copy()} method);
    * {@code mBegan} and {@code mEnded} are handed to the new instance
    * unchanged.
+   *
    * @return A semi-deep copy of this instance.
    */
   public Lexeme copy() {
     return new Lexeme( mType.copy(), mBegan, mEnded );
+  }
   /**
    * Answers whether the given {@link LexemeType} is the same as this
    * instance's internal {@link LexemeType}.

M src/main/java/com/whitemagicsoftware/keenquotes/lex/LexemeType.java

   /**
    * Creates a new instance with a copy of {@link LexemeGlyph} to prevent
    * mutations made by calling {@link #with(LexemeGlyph)} from affecting the
    * resolution of ambiguous quotes.
+   *
    * @return A semi-deep copy of this instance.
    */
   LexemeType copy() {
     // NOTE(review): the value returned by glyph() is passed to the
     // constructor as-is; whether that value is itself a fresh copy is not
     // visible from here -- confirm against the documentation above.
     return new LexemeType( glyph() );
+  }
   /**
    * Changes the type of glyph associated with this type of lexeme. This
    * is useful for passing along different glyphs represented by the same

M src/main/java/com/whitemagicsoftware/keenquotes/parser/AmbiguityResolver.java

    if( token.isType( QUOTE_OPENING_SINGLE ) ||
      token.isType( QUOTE_OPENING_DOUBLE ) ) {
      mTree = mTree.opening( token );
      mTree = mTree.opening( token.copy() );
    }
    // Close the subtree if it was open, try to close it.
    else if( token.isType( QUOTE_CLOSING_SINGLE ) ||
      token.isType( QUOTE_CLOSING_DOUBLE ) ) {
      mTree = mTree.closing( token );
      mTree = mTree.closing( token.copy() );
    }
    else if( token.isType( QUOTE_AMBIGUOUS_DOUBLE ) ) {
      // Create subtrees for: <" ... ">, <" ">, <"">, etc.
      if( mTree.hasOpeningDoubleQuote() ) {
        token.setTokenType( QUOTE_CLOSING_DOUBLE );
        mTree = mTree.closing( token );
        mTree = mTree.closing( token.copy() );
      }
      else {
        token.setTokenType( QUOTE_OPENING_DOUBLE );
        mTree = mTree.opening( token );
        mTree = mTree.opening( token.copy() );
      }
    }
    // Add ambiguous tokens to be resolved; add apostrophes for later emitting.
    else {
      mTree.add( token );
      mTree.add( token.copy() );
    }
  }

M src/main/java/com/whitemagicsoftware/keenquotes/parser/QuoteEmitter.java

      emit( QUOTE_OPENING_DOUBLE, lex2 );
    }
    else if( match( ANY, QUOTE_DOUBLE, ANY, ANY ) ) {
      emit( QUOTE_AMBIGUOUS_DOUBLE, lex2 );
    }
    // International opening double quotation mark.
    // International quotation marks.
    else if( match( ANY, QUOTE_DOUBLE_OPENING, ANY, ANY ) ) {
      emit( QUOTE_OPENING_DOUBLE, lex2 );
    }
    // International opening single quotation mark.
    else if( match( ANY, QUOTE_SINGLE_OPENING, ANY, ANY ) ) {
      emit( QUOTE_OPENING_SINGLE, lex2 );
    }
    // International double closing quotation mark.
    else if( match( ANY, ANY, ANY, QUOTE_DOUBLE_CLOSING ) ) {
      emit( QUOTE_CLOSING_DOUBLE, lex4 );
    else if( match( ANY, QUOTE_DOUBLE_CLOSING, ANY, ANY  ) ) {
      emit( QUOTE_CLOSING_DOUBLE, lex2 );
    }
    // International single closing quotation mark.
    else if( match( ANY, ANY, ANY, QUOTE_SINGLE_CLOSING ) ) {
      emit( QUOTE_CLOSING_SINGLE, lex4 );
    else if( match( ANY, QUOTE_SINGLE_CLOSING, ANY, ANY ) ) {
      emit( QUOTE_CLOSING_SINGLE, lex2 );
    }
    // Ambiguous (no match)
    else if( match( ANY, QUOTE_SINGLE, ANY, ANY ) ) {
      emit( QUOTE_AMBIGUOUS_SINGLE, lex2 );
    }
    else if( match( ANY, QUOTE_DOUBLE, ANY, ANY ) ) {
      emit( QUOTE_AMBIGUOUS_DOUBLE, lex2 );
    }
  }

M src/main/java/com/whitemagicsoftware/keenquotes/parser/Token.java

   /**
    * Creates a new instance with a copy of {@link Lexeme} to prevent
    * subsequent mutations from affecting the resolution of ambiguous quotes.
    * Only the lexeme is duplicated (through its own {@code copy()} method);
    * {@code mTokenType} is handed to the new instance unchanged.
+   *
    * @return A semi-deep copy of this instance.
    */
   Token copy() {
     return new Token( mTokenType, mLexeme.copy() );
+  }
   /**
    * Answers whether this {@link Token} appears before the given {@link Token}
    * in the document. If they overlap, this will return {@code false}.

M src/test/resources/com/whitemagicsoftware/keenquotes/texts/i18n.txt

 # ########################################################################
 # Mixed
 # ########################################################################
 «What's ‹going› on?» ,,Hey there!"
 &laquo;What&apos;s &lsaquo;going&rsaquo; on?&raquo; &#8222;Hey there!&rdquo;
 # ########################################################################
 # French
 # ########################################################################

57	57	if( token.isType( QUOTE_OPENING_SINGLE ) \|\|
58	58	token.isType( QUOTE_OPENING_DOUBLE ) ) {
59		mTree = mTree.opening( token );
	59	mTree = mTree.opening( token.copy() );
60	60	}
61	61	// Close the subtree if it was open, try to close it.
62	62	else if( token.isType( QUOTE_CLOSING_SINGLE ) \|\|
63	63	token.isType( QUOTE_CLOSING_DOUBLE ) ) {
64		mTree = mTree.closing( token );
	64	mTree = mTree.closing( token.copy() );
65	65	}
66	66	else if( token.isType( QUOTE_AMBIGUOUS_DOUBLE ) ) {
67	67	// Create subtrees for: <" ... ">, <" ">, <"">, etc.
68	68	if( mTree.hasOpeningDoubleQuote() ) {
69	69	token.setTokenType( QUOTE_CLOSING_DOUBLE );
70		mTree = mTree.closing( token );
	70	mTree = mTree.closing( token.copy() );
71	71	}
72	72	else {
73	73	token.setTokenType( QUOTE_OPENING_DOUBLE );
74		mTree = mTree.opening( token );
	74	mTree = mTree.opening( token.copy() );
75	75	}
76	76	}
77	77	// Add ambiguous tokens to be resolved; add apostrophes for later emitting.
78	78	else {
79		mTree.add( token );
	79	mTree.add( token.copy() );
80	80	}
81	81	}

358	358	emit( QUOTE_OPENING_DOUBLE, lex2 );
359	359	}
360		else if( match( ANY, QUOTE_DOUBLE, ANY, ANY ) ) {
361		emit( QUOTE_AMBIGUOUS_DOUBLE, lex2 );
362		}
363		// International opening double quotation mark.
	360	// International quotation marks.
364	361	else if( match( ANY, QUOTE_DOUBLE_OPENING, ANY, ANY ) ) {
365	362	emit( QUOTE_OPENING_DOUBLE, lex2 );
366	363	}
367		// International opening single quotation mark.
368	364	else if( match( ANY, QUOTE_SINGLE_OPENING, ANY, ANY ) ) {
369	365	emit( QUOTE_OPENING_SINGLE, lex2 );
370	366	}
371		// International double closing quotation mark.
372		else if( match( ANY, ANY, ANY, QUOTE_DOUBLE_CLOSING ) ) {
373		emit( QUOTE_CLOSING_DOUBLE, lex4 );
	367	else if( match( ANY, QUOTE_DOUBLE_CLOSING, ANY, ANY ) ) {
	368	emit( QUOTE_CLOSING_DOUBLE, lex2 );
374	369	}
375		// International single closing quotation mark.
376		else if( match( ANY, ANY, ANY, QUOTE_SINGLE_CLOSING ) ) {
377		emit( QUOTE_CLOSING_SINGLE, lex4 );
	370	else if( match( ANY, QUOTE_SINGLE_CLOSING, ANY, ANY ) ) {
	371	emit( QUOTE_CLOSING_SINGLE, lex2 );
378	372	}
379	373	// Ambiguous (no match)
380	374	else if( match( ANY, QUOTE_SINGLE, ANY, ANY ) ) {
381	375	emit( QUOTE_AMBIGUOUS_SINGLE, lex2 );
	376	}
	377	else if( match( ANY, QUOTE_DOUBLE, ANY, ANY ) ) {
	378	emit( QUOTE_AMBIGUOUS_DOUBLE, lex2 );
382	379	}
383	380	}