1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18 package org.apache.any23.extractor.html;
19
20 import org.apache.any23.extractor.ExtractorFactory;
21 import org.junit.Test;
22 import org.eclipse.rdf4j.model.IRI;
23 import org.eclipse.rdf4j.model.ValueFactory;
24 import org.eclipse.rdf4j.model.impl.SimpleValueFactory;
25 import org.eclipse.rdf4j.repository.RepositoryException;
26
27
28
29
30
31
32 public class HeadLinkExtractorTest extends AbstractExtractorTestCase {
33
34 @Override
35 protected ExtractorFactory<?> getExtractorFactory() {
36 return new HeadLinkExtractorFactory();
37 }
38
39 @Test
40 public void testLinkExtraction() throws RepositoryException {
41 assertExtract("/html/html-head-link-extractor.html");
42 assertModelNotEmpty();
43 final ValueFactory valueFactory = SimpleValueFactory.getInstance();
44 final IRI externalLinkIRI = valueFactory.createIRI("http://www.myexperiment.org/workflows/16.rdf");
45 assertContains(AbstractExtractorTestCase.baseIRI,
46 valueFactory.createIRI("http://www.w3.org/1999/xhtml/vocab#alternate"), externalLinkIRI
47
48 );
49 assertContains(externalLinkIRI, valueFactory.createIRI("http://purl.org/dc/terms/title"),
50 valueFactory.createLiteral("RDF+XML")
51
52 );
53 assertContains(externalLinkIRI, valueFactory.createIRI("http://purl.org/dc/terms/format"),
54 valueFactory.createLiteral("application/rdf+xml")
55
56 );
57 }
58 }