Merge pull request #212 from simonvbrae/feature/rdfstar_parsing

RubenVerborgh · web-flow · commit 3016dbd003c2 · 2020-07-27T00:07:02.000+02:00
Added parsing for RDF* syntax
diff --git a/src/N3Lexer.js b/src/N3Lexer.js
@@ -39,9 +39,9 @@ export default class N3Lexer {
     this._simpleApostropheString = /^'([^'\\\r\n]*)'(?=[^'])/;
     this._langcode = /^@([a-z]+(?:-[a-z0-9]+)*)(?=[^a-z0-9\-])/i;
     this._prefix = /^((?:[A-Za-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])(?:\.?[\-0-9A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])*)?:(?=[#\s<])/;
-    this._prefixed = /^((?:[A-Za-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])(?:\.?[\-0-9A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])*)?:((?:(?:[0-:A-Z_a-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff]|%[0-9a-fA-F]{2}|\\[!#-\/;=?\-@_~])(?:(?:[\.\-0-:A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff]|%[0-9a-fA-F]{2}|\\[!#-\/;=?\-@_~])*(?:[\-0-:A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff]|%[0-9a-fA-F]{2}|\\[!#-\/;=?\-@_~]))?)?)(?:[ \t]+|(?=\.?[,;!\^\s#()\[\]\{\}"'<]))/;
+    this._prefixed = /^((?:[A-Za-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])(?:\.?[\-0-9A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])*)?:((?:(?:[0-:A-Z_a-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff]|%[0-9a-fA-F]{2}|\\[!#-\/;=?\-@_~])(?:(?:[\.\-0-:A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff]|%[0-9a-fA-F]{2}|\\[!#-\/;=?\-@_~])*(?:[\-0-:A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff]|%[0-9a-fA-F]{2}|\\[!#-\/;=?\-@_~]))?)?)(?:[ \t]+|(?=\.?[,;!\^\s#()\[\]\{\}"'<>]))/;
     this._variable = /^\?(?:(?:[A-Z_a-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])(?:[\-0-:A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])*)(?=[.,;!\^\s#()\[\]\{\}"'<])/;
-    this._blank = /^_:((?:[0-9A-Z_a-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])(?:\.?[\-0-9A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])*)(?:[ \t]+|(?=\.?[,;:\s#()\[\]\{\}"'<]))/;
+    this._blank = /^_:((?:[0-9A-Z_a-z\xc0-\xd6\xd8-\xf6\xf8-\u02ff\u0370-\u037d\u037f-\u1fff\u200c\u200d\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])(?:\.?[\-0-9A-Z_a-z\xb7\xc0-\xd6\xd8-\xf6\xf8-\u037d\u037f-\u1fff\u200c\u200d\u203f\u2040\u2070-\u218f\u2c00-\u2fef\u3001-\ud7ff\uf900-\ufdcf\ufdf0-\ufffd]|[\ud800-\udb7f][\udc00-\udfff])*)(?:[ \t]+|(?=\.?[,;:\s#()\[\]\{\}"'<>]))/;
     this._number = /^[\-+]?(?:(\d+\.\d*|\.?\d+)[eE][\-+]?|\d*(\.)?)\d+(?=\.?[,;:\s#()\[\]\{\}"'<])/;
     this._boolean = /^(?:true|false)(?=[.,;\s#()\[\]\{\}"'<])/;
     this._keyword = /^@[a-z]+(?=[\s#<:])/i;
@@ -143,11 +143,19 @@ export default class N3Lexer {
             return reportSyntaxError(this);
           type = 'IRI';
         }
+        // Try to find a nested triple
+        else if (input.length > 1 && input[1] === '<')
+          type = '<<', matchLength = 2;
         // Try to find a backwards implication arrow
         else if (this._n3Mode && input.length > 1 && input[1] === '=')
           type = 'inverse', matchLength = 2, value = '>';
         break;
 
+      case '>':
+        if (input.length > 1 && input[1] === '>')
+          type = '>>', matchLength = 2;
+        break;
+
       case '_':
         // Try to find a blank node. Since it can contain (but not end with) a dot,
         // we always need a non-dot character before deciding it is a blank node.
diff --git a/src/N3Parser.js b/src/N3Parser.js
@@ -19,13 +19,16 @@ export default class N3Parser {
     // Set supported features depending on the format
     var format = (typeof options.format === 'string') ?
                  options.format.match(/\w*$/)[0].toLowerCase() : '',
-        isTurtle = format === 'turtle', isTriG = format === 'trig',
+        isTurtle = /turtle/.test(format), isTriG = /trig/.test(format),
         isNTriples = /triple/.test(format), isNQuads = /quad/.test(format),
         isN3 = this._n3Mode = /n3/.test(format),
         isLineMode = isNTriples || isNQuads;
     if (!(this._supportsNamedGraphs = !(isTurtle || isN3)))
       this._readPredicateOrNamedGraph = this._readPredicate;
+    // Support triples in other graphs
     this._supportsQuads = !(isTurtle || isTriG || isNTriples || isN3);
+    // Support nesting of triples
+    this._supportsRDFStar = format === '' || /star|\*$/.test(format);
     // Disable relative IRIs in N-Triples or N-Quads mode
     if (isLineMode)
       this._resolveRelativeIRI = function (iri) { return null; };
@@ -228,6 +231,12 @@ export default class N3Parser {
         this._subject = this._literal(token.value, this._namedNode(token.prefix));
 
       break;
+    case '<<':
+      if (!this._supportsRDFStar)
+        return this._error('Unexpected RDF* syntax', token);
+      this._saveContext('<<', this._graph, null, null, null);
+      this._graph = null;
+      return this._readSubject;
     default:
       // Read the subject entity
       if ((this._subject = this._readEntity(token)) === undefined)
@@ -304,6 +313,12 @@ export default class N3Parser {
       this._saveContext('formula', this._graph, this._subject, this._predicate,
                         this._graph = this._blankNode());
       return this._readSubject;
+    case '<<':
+      if (!this._supportsRDFStar)
+        return this._error('Unexpected RDF* syntax', token);
+      this._saveContext('<<', this._graph, this._subject, this._predicate, null);
+      this._graph = null;
+      return this._readSubject;
     default:
       // Read the object entity
       if ((this._object = this._readEntity(token)) === undefined)
@@ -802,6 +817,37 @@ export default class N3Parser {
     return this._readPath;
   }
 
+  // ### `_readRDFStarTailOrGraph` reads what follows the object of a nested RDF* statement: either the graph term of a nested quad or the closing `>>` of a nested triple
+  _readRDFStarTailOrGraph(token) {
+    if (token.type !== '>>') {
+      // Any other token is tried as a graph term, which makes this a quad (only attempted when quads are supported and no graph is set yet); on success, the next token must be the closing `>>`
+      if (this._supportsQuads && this._graph === null && (this._graph = this._readEntity(token)) !== undefined)
+        return this._readRDFStarTail;
+      return this._error('Expected >> to follow "' + this._object.id + '"', token);
+    }
+    return this._readRDFStarTail(token);
+  }
+
+  // ### `_readRDFStarTail` reads the closing `>>` of a nested RDF* triple and makes the nested statement a term of the enclosing statement
+  _readRDFStarTail(token) {
+    if (token.type !== '>>')
+      return this._error(`Expected >> but got ${token.type}`, token);
+    // Build the quad from the nested subject, predicate, and object (using DEFAULTGRAPH when no graph was read), then restore the context that was saved when `<<` was encountered
+    const quad = this._quad(this._subject, this._predicate, this._object,
+      this._graph || this.DEFAULTGRAPH);
+    this._restoreContext();
+    // A null subject after restoring means the `<<` was in subject position (that context is saved with a null subject): the quad becomes the subject, and the predicate is read next.
+    if (this._subject === null) {
+      this._subject = quad;
+      return this._readPredicate;
+    }
+    // Otherwise the `<<` was in object position: the quad becomes the object, and the reader for the end of the enclosing context takes over.
+    else {
+      this._object = quad;
+      return this._getContextEndReader();
+    }
+  }
+
   // ### `_getContextEndReader` gets the next reader function at the end of a context
   _getContextEndReader() {
     var contextStack = this._contextStack;
@@ -815,6 +861,8 @@ export default class N3Parser {
       return this._readListItem;
     case 'formula':
       return this._readFormulaTail;
+    case '<<':
+      return this._readRDFStarTailOrGraph;
     }
   }
 
diff --git a/test/N3Lexer-test.js b/test/N3Lexer-test.js
@@ -28,6 +28,11 @@ describe('Lexer', function () {
                      { type: 'IRI', value: 'http://ex.org/?bla#foo', line: 1 },
                      { type: 'eof', line: 1 }));
 
+    it('should tokenize a split IRI',
+      shouldTokenize(streamOf('<', 'http://ex.org/?bla#foo>'),
+        { type: 'IRI', value: 'http://ex.org/?bla#foo', line: 1 },
+        { type: 'eof', line: 1 }));
+
     it('should not tokenize an IRI with disallowed characters',
       shouldNotTokenize('<http://ex.org/bla"foo>',
                         'Unexpected "<http://ex.org/bla"foo>" on line 1.'));
@@ -788,6 +793,13 @@ describe('Lexer', function () {
                      { type: 'IRI', value: 'b', line: 1 },
                      { type: 'eof', line: 1 }));
 
+    it('should tokenize a split left implication',
+      shouldTokenize(streamOf('<a> <', '= <b> '),
+        { type: 'IRI', value: 'a', line: 1 },
+        { type: 'inverse', value: '>', line: 1 },
+        { type: 'IRI', value: 'b', line: 1 },
+        { type: 'eof', line: 1 }));
+
     it('should tokenize paths',
       shouldTokenize(':joe!fam:mother!loc:office!loc:zip :joe!fam:mother^fam:mother',
                      { type: 'prefixed', prefix: '', value: 'joe', line: 1 },
@@ -812,6 +824,220 @@ describe('Lexer', function () {
       new Lexer().tokenize({ on: function () {} });
     });
 
+    it('should tokenize an Quadterm start',
+      shouldTokenize('<<',
+        { type: '<<', line: 1 }, { type: 'eof', line: 1 }));
+
+    it('should tokenize a split Quadterm start',
+      shouldTokenize(streamOf('<', '<'),
+        { type: '<<', line: 1 }, { type: 'eof', line: 1 }));
+
+    it('should tokenize an Quadterm end',
+      shouldTokenize('>>',
+        { type: '>>', line: 1 }, { type: 'eof', line: 1 }));
+
+    it('should tokenize an empty Quadterm',
+      shouldTokenize('<< >>',
+        { type: '<<', line: 1 },
+        { type: '>>', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize an RDF* statement with IRIs',
+      shouldTokenize('<<<http://ex.org/?bla#foo> \n\t<http://ex.org/?bla#bar> \n\t<http://ex.org/?bla#boo>>> .',
+        { type: '<<', line: 1 },
+        { type: 'IRI', value: 'http://ex.org/?bla#foo', line: 1 },
+        { type: 'IRI', value: 'http://ex.org/?bla#bar', line: 2 },
+        { type: 'IRI', value: 'http://ex.org/?bla#boo', line: 3 },
+        { type: '>>', line: 3 },
+        { type: '.', line: 3 },
+        { type: 'eof', line: 3 }));
+
+    it('should not tokenize a wrongly closed RDF* statement with IRIs',
+      shouldNotTokenize('<<<http://ex.org/?bla#foo> \n\t<http://ex.org/?bla#bar> \n\t<http://ex.org/?bla#boo>> .',
+        'Unexpected ">" on line 3.'));
+
+    it('should tokenize a split RDF* statement with IRIs',
+      shouldTokenize(streamOf('<', '<<http://ex.org/?bla#foo> \n\t<http://ex.org/?bla#bar> \n\t<http://ex.org/?bla#boo>>> .'),
+        { type: '<<', line: 1 },
+        { type: 'IRI', value: 'http://ex.org/?bla#foo', line: 1 },
+        { type: 'IRI', value: 'http://ex.org/?bla#bar', line: 2 },
+        { type: 'IRI', value: 'http://ex.org/?bla#boo', line: 3 },
+        { type: '>>', line: 3 },
+        { type: '.', line: 3 },
+        { type: 'eof', line: 3 }));
+
+    it('should tokenize an RDF* statement with literals',
+      shouldTokenize('<<"string"@en "string"@nl-be "string"@EN>> .',
+        { type: '<<', line: 1 },
+        { type: 'literal', value: 'string', line: 1 },
+        { type: 'langcode', value: 'en', line: 1 },
+        { type: 'literal', value: 'string', line: 1 },
+        { type: 'langcode', value: 'nl-be', line: 1 },
+        { type: 'literal', value: 'string', line: 1 },
+        { type: 'langcode', value: 'EN', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize a prefixed iri followed by the end of a QuadTerm',
+      shouldTokenize('c:c>> .',
+        { type: 'prefixed', prefix: 'c', value: 'c', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize an RDF* statement with prefixed names',
+      shouldTokenize('<<a:a b:b c:c>> .',
+        { type: '<<', line: 1 },
+        { type: 'prefixed', prefix: 'a', value: 'a', line: 1 },
+        { type: 'prefixed', prefix: 'b', value: 'b', line: 1 },
+        { type: 'prefixed', prefix: 'c', value: 'c', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize an RDF* statement with blank nodes',
+      shouldTokenize('<<_:a _:b _:c>> .',
+        { type: '<<', line: 1 },
+        { type: 'blank', prefix: '_', value: 'a', line: 1 },
+        { type: 'blank', prefix: '_', value: 'b', line: 1 },
+        { type: 'blank', prefix: '_', value: 'c', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize an RDF* statement with mixed types (IRI, literal, prefixed name)',
+      shouldTokenize('<<<http://ex.org/?bla#foo> "string"@nl-be c:c>> .',
+        { type: '<<', line: 1 },
+        { type: 'IRI', value: 'http://ex.org/?bla#foo', line: 1 },
+        { type: 'literal', value: 'string', line: 1 },
+        { type: 'langcode', value: 'nl-be', line: 1 },
+        { type: 'prefixed', prefix: 'c', value: 'c', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize an RDF* statement with mixed types (blank node, prefixed name, literal)',
+      shouldTokenize('<<_:a a:a "string"@EN>> .',
+        { type: '<<', line: 1 },
+        { type: 'blank', prefix: '_', value: 'a', line: 1 },
+        { type: 'prefixed', prefix: 'a', value: 'a', line: 1 },
+        { type: 'literal', value: 'string', line: 1 },
+        { type: 'langcode', value: 'EN', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize an RDF* statement with mixed types (literal, IRI, blank node)',
+      shouldTokenize('<<"literal"@AU <http://ex.org/?bla#foo> _:a>> .',
+        { type: '<<', line: 1 },
+        { type: 'literal', value: 'literal', line: 1 },
+        { type: 'langcode', value: 'AU', line: 1 },
+        { type: 'IRI', value: 'http://ex.org/?bla#foo', line: 1 },
+        { type: 'blank', prefix: '_', value: 'a', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize RDF* statements with shared subjects',
+      shouldTokenize('<<<a> <b> <c>;\n<d> <e>>>.',
+        { type: '<<', line: 1 },
+        { type: 'IRI', value: 'a', line: 1 },
+        { type: 'IRI', value: 'b', line: 1 },
+        { type: 'IRI', value: 'c', line: 1 },
+        { type: ';', line: 1 },
+        { type: 'IRI', value: 'd', line: 2 },
+        { type: 'IRI', value: 'e', line: 2 },
+        { type: '>>', line: 2 },
+        { type: '.', line: 2 },
+        { type: 'eof', line: 2 }));
+
+    it('should tokenize RDF* statements with shared subjects and predicates',
+      shouldTokenize('<<<a> <b> <c>,\n<d>>>.',
+        { type: '<<', line: 1 },
+        { type: 'IRI', value: 'a', line: 1 },
+        { type: 'IRI', value: 'b', line: 1 },
+        { type: 'IRI', value: 'c', line: 1 },
+        { type: ',', line: 1 },
+        { type: 'IRI', value: 'd', line: 2 },
+        { type: '>>', line: 2 },
+        { type: '.', line: 2 },
+        { type: 'eof', line: 2 }));
+
+    it('should tokenize an RDF* statement with shared subjects and predicates and prefixed names',
+      shouldTokenize('<<a:a b:b c:c;d:d e:e,f:f>> .',
+        { type: '<<', line: 1 },
+        { type: 'prefixed', prefix: 'a', value: 'a', line: 1 },
+        { type: 'prefixed', prefix: 'b', value: 'b', line: 1 },
+        { type: 'prefixed', prefix: 'c', value: 'c', line: 1 },
+        { type: ';', line: 1 },
+        { type: 'prefixed', prefix: 'd', value: 'd', line: 1 },
+        { type: 'prefixed', prefix: 'e', value: 'e', line: 1 },
+        { type: ',', line: 1 },
+        { type: 'prefixed', prefix: 'f', value: 'f', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize a QuadTerm followed by other tokens',
+      shouldTokenize('<<_:a <b> "lit"@EN>> _:a b:b.',
+        { type: '<<', line: 1 },
+        { type: 'blank', prefix: '_', value: 'a', line: 1 },
+        { type: 'IRI', value: 'b', line: 1 },
+        { type: 'literal', value: 'lit', line: 1 },
+        { type: 'langcode', value: 'EN', line: 1 },
+        { type: '>>', line: 1 },
+        { type: 'blank', prefix: '_', value: 'a', line: 1 },
+        { type: 'prefixed', prefix: 'b', value: 'b', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize a QuadTerm preceded by other tokens',
+      shouldTokenize('"lit"@DE _:b <<_:a b:b "lit"@EN>>.',
+        { type: 'literal', value: 'lit', line: 1 },
+        { type: 'langcode', value: 'DE', line: 1 },
+        { type: 'blank', prefix: '_', value: 'b', line: 1 },
+        { type: '<<', line: 1 },
+        { type: 'blank', prefix: '_', value: 'a', line: 1 },
+        { type: 'prefixed', prefix: 'b', value: 'b', line: 1 },
+        { type: 'literal', value: 'lit', line: 1 },
+        { type: 'langcode', value: 'EN', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize a nested QuadTerm as subject in a statement',
+      shouldTokenize('<<<<_:b <b> "lit"@DE>> <a> "lit"@EN>>.',
+        { type: '<<', line: 1 },
+        { type: '<<', line: 1 },
+        { type: 'blank', prefix: '_', value: 'b', line: 1 },
+        { type: 'IRI', value: 'b', line: 1 },
+        { type: 'literal', value: 'lit', line: 1 },
+        { type: 'langcode', value: 'DE', line: 1 },
+        { type: '>>', line: 1 },
+        { type: 'IRI', value: 'a', line: 1 },
+        { type: 'literal', value: 'lit', line: 1 },
+        { type: 'langcode', value: 'EN', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+    it('should tokenize a nested QuadTerm as object in a statement',
+      shouldTokenize('<<a:a _:a <<_:b <b> "lit"@DE>>>>.',
+        { type: '<<', line: 1 },
+        { type: 'prefixed', prefix: 'a', value: 'a', line: 1 },
+        { type: 'blank', prefix: '_', value: 'a', line: 1 },
+        { type: '<<', line: 1 },
+        { type: 'blank', prefix: '_', value: 'b', line: 1 },
+        { type: 'IRI', value: 'b', line: 1 },
+        { type: 'literal', value: 'lit', line: 1 },
+        { type: 'langcode', value: 'DE', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '>>', line: 1 },
+        { type: '.', line: 1 },
+        { type: 'eof', line: 1 }));
+
+
     describe('passing data after the stream has been finished', function () {
       var tokens = [], error;
       before(function () {
diff --git a/test/N3Parser-test.js b/test/N3Parser-test.js