Read all files from a directory
This commit is contained in:
parent
0620f42fa4
commit
68efc348bd
4
pom.xml
4
pom.xml
|
@ -14,8 +14,8 @@
|
||||||
|
|
||||||
<properties>
|
<properties>
|
||||||
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
|
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
|
||||||
<maven.compiler.source>1.7</maven.compiler.source>
|
<maven.compiler.source>1.8</maven.compiler.source>
|
||||||
<maven.compiler.target>1.7</maven.compiler.target>
|
<maven.compiler.target>1.8</maven.compiler.target>
|
||||||
</properties>
|
</properties>
|
||||||
|
|
||||||
<dependencies>
|
<dependencies>
|
||||||
|
|
|
@ -0,0 +1,32 @@
|
||||||
|
package org.RI.P1;
|
||||||
|
|
||||||
|
import java.io.File;
|
||||||
|
import java.io.IOException;
|
||||||
|
import java.nio.file.Files;
|
||||||
|
import java.nio.file.Path;
|
||||||
|
import java.nio.file.Paths;
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.stream.Collectors;
|
||||||
|
|
||||||
|
import org.apache.tika.exception.TikaException;
|
||||||
|
import org.xml.sax.SAXException;
|
||||||
|
|
||||||
|
public class AnalyzeDirectory {
|
||||||
|
private static List<File> files;
|
||||||
|
|
||||||
|
private static void readFiles(String directory) throws IOException {
|
||||||
|
files = Files.walk(Paths.get(directory)).filter(Files::isRegularFile).map(Path::toFile)
|
||||||
|
.collect(Collectors.toList());
|
||||||
|
}
|
||||||
|
|
||||||
|
public static void main(String[] args) throws IOException, TikaException, SAXException {
|
||||||
|
String directory = args[0];
|
||||||
|
readFiles(directory);
|
||||||
|
for (File file : files) {
|
||||||
|
FileData data = new FileData(file);
|
||||||
|
System.out.println(data);
|
||||||
|
System.out.println("--------------------------------------------------------------------------");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
|
@ -30,13 +30,14 @@ public class FileData {
|
||||||
FileData() {
|
FileData() {
|
||||||
}
|
}
|
||||||
|
|
||||||
FileData(File file) throws FileNotFoundException {
|
FileData(File file) throws IOException, TikaException, SAXException {
|
||||||
inputStream = new FileInputStream(file);
|
inputStream = new FileInputStream(file);
|
||||||
metadata = new Metadata();
|
metadata = new Metadata();
|
||||||
parser = new AutoDetectParser();
|
parser = new AutoDetectParser();
|
||||||
contentHandler = new BodyContentHandler(-1);
|
contentHandler = new BodyContentHandler(-1);
|
||||||
parseContext = new ParseContext();
|
parseContext = new ParseContext();
|
||||||
langIdentifier = new OptimaizeLangDetector().loadModels();
|
langIdentifier = new OptimaizeLangDetector().loadModels();
|
||||||
|
setMetadata();
|
||||||
}
|
}
|
||||||
|
|
||||||
private void setMetadata() throws IOException, TikaException, SAXException {
|
private void setMetadata() throws IOException, TikaException, SAXException {
|
||||||
|
@ -53,14 +54,4 @@ public class FileData {
|
||||||
+ language.getLanguage() + "\n";
|
+ language.getLanguage() + "\n";
|
||||||
}
|
}
|
||||||
|
|
||||||
public static void main(String[] args) throws IOException, TikaException, SAXException {
|
|
||||||
try {
|
|
||||||
File file = new File(args[0]);
|
|
||||||
FileData data = new FileData(file);
|
|
||||||
data.setMetadata();
|
|
||||||
System.out.println(data);
|
|
||||||
} catch (FileNotFoundException exp) {
|
|
||||||
System.out.println("The file " + args[0] + " could not be found");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue