Skip to content
GitLab
Projects
Groups
Snippets
Help
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
S
scidetect
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Service Desk
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Operations
Operations
Incidents
Environments
Packages & Registries
Packages & Registries
Container Registry
Analytics
Analytics
CI / CD
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
Cyril Labbe
scidetect
Commits
f4acfdaf
Commit
f4acfdaf
authored
Mar 11, 2015
by
Tien
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
delete temps, added jar
parent
03da7eb9
Changes
4
Hide whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
0 additions
and
541 deletions
+0
-541
dist/SciDetect_Local.jar
dist/SciDetect_Local.jar
+0
-0
src/fr/imag/forge/scidetect/SciDetect_local/Scidetect_Local.java
...imag/forge/scidetect/SciDetect_local/Scidetect_Local.java
+0
-180
src/fr/imag/forge/scidetect/SciDetect_local/ScigenChecker_Local.java~
...forge/scidetect/SciDetect_local/ScigenChecker_Local.java~
+0
-181
src/fr/imag/forge/scidetect/scigenchecker_local/ScigenChecker_Local.java
...ge/scidetect/scigenchecker_local/ScigenChecker_Local.java
+0
-180
No files found.
dist/SciDetect_Local.jar
0 → 100644
View file @
f4acfdaf
File added
src/fr/imag/forge/scidetect/SciDetect_local/Scidetect_Local.java
deleted
100644 → 0
View file @
03da7eb9
/*
* Copyright (C) 2015 UNIVERSITE JOSEPH FOURIER (Grenoble 1)/ Springer-Verlag GmbH
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
package
fr.imag.forge.scidetect.SciDetect_local
;
import
fr.imag.forge.scidetect.Checker.Classifier
;
import
fr.imag.forge.scidetect.Checker.DistantCalculator
;
import
fr.imag.forge.scidetect.Checker.Reader
;
import
fr.imag.forge.scidetect.Checker.Utils.DistancesSet
;
import
fr.imag.forge.scidetect.Logger.Log
;
import
fr.imag.forge.scidetect.Corpus.Corpus
;
import
java.io.BufferedReader
;
import
java.io.File
;
import
java.io.FileNotFoundException
;
import
java.io.FileReader
;
import
java.io.IOException
;
import
java.text.DateFormat
;
import
java.text.SimpleDateFormat
;
import
java.util.Date
;
/**
 * Standalone command-line entry point of the checker.
 *
 * <p>The run has three phases, driven by {@link #main(String[])}: defaults are
 * read from {@code config.txt}, command-line options override them, and the
 * files to test are then compared against the samples, classified and logged.
 *
 * @author Nguyen Minh Tien - minh-tien.nguyen@imag.fr
 */
public class Scidetect_Local {

    /** Configuration file name, resolved against the current working directory. */
    private static final String CONFIG_FILE = "config.txt";

    /** Folder containing the files to check; set by the {@code -c} option. */
    private String testpath;

    /** Corpus built from the sample folder. */
    private Corpus samples = new Corpus();

    /** Corpus built from the files found under {@link #testpath}. */
    private Corpus tests = new Corpus();

    /** Sample folder, taken from the {@code samples} entry of the config file. */
    private String SamplesFolder;

    /** Distances computed between the samples and the tested files. */
    DistancesSet distant = new DistancesSet();

    /** Whether a detailed log must also be written; set by the {@code -d} option. */
    private boolean savedetaillog = false;

    /**
     * Reads the config file:
     * - places where to find samples of each class
     * - default places where to write results.
     *
     * <p>Each useful line is {@code key<TAB>value}. Lines starting with
     * {@code #} are comments. Lines without a value are skipped instead of
     * failing with an {@link ArrayIndexOutOfBoundsException}.
     *
     * @throws FileNotFoundException if {@code config.txt} cannot be opened
     * @throws IOException if reading the file fails
     */
    private void readconfig() throws FileNotFoundException, IOException {
        BufferedReader br = new BufferedReader(new FileReader(new File(CONFIG_FILE)));
        try {
            String line;
            while ((line = br.readLine()) != null) {
                if (line.startsWith("#")) {
                    continue;
                }
                String[] b = line.split("\t");
                if (b.length < 2) {
                    // Blank line or key without a value: split() also drops a
                    // trailing empty field, so there is nothing to store.
                    continue;
                }
                if (b[0].equals("samples")) {
                    SamplesFolder = b[1];
                } else if (b[0].equals("Default_log_folder")) {
                    Log.loglocation = b[1];
                } else if (b[0].equals("Default_detail_log_folder")) {
                    Log.detailloglocation = b[1];
                }
            }
        } finally {
            // Always release the file handle, even when readLine() throws.
            br.close();
        }
    }

    /**
     * Runs the check: reads samples and tests, computes the distances,
     * classifies them, prints the conclusion and saves it to the log.
     *
     * <p>Nothing is computed when no test folder was given; a hint is printed
     * instead. A failure while reading is reported on standard output and the
     * run deliberately continues with whatever corpora are available.
     *
     * @throws IOException if a call outside the guarded read phase reports an
     *         I/O error
     */
    private void compute() throws IOException {
        if (testpath == null) {
            System.out.println("***** Can not read path to the folder:" + testpath);
            System.out.println("***** The folder should contains file to check");
            return;
        }

        // Time stamp shared with the logger for this run.
        DateFormat dateFormat = new SimpleDateFormat("HH:mm dd.MM.yyyy");
        Log.logtime = dateFormat.format(new Date());

        try {
            Reader reader = new Reader();
            reader.readconfig();
            samples = reader.readsamples(SamplesFolder);
            tests = reader.readtests(testpath);
        } catch (Exception e) {
            // Best effort by design: report the failure and keep going.
            System.out.println("* Something went wrong during:");
            System.out.println(" - reading the config file");
            System.out.println(" - or reading the samples (dir data)");
            System.out.println(" - or txt extraction from pdf");
            System.out.println("* Continuing anyway...");
        }

        DistantCalculator dc = new DistantCalculator();
        distant = dc.caldistant(samples, tests);

        Classifier cl = new Classifier();
        String conclusion = cl.classify(distant);
        System.out.println(conclusion);

        Log log = new Log();
        log.savelog(conclusion);
        if (savedetaillog) {
            log.savedetaillog(distant);
        }
    }

    /**
     * Parses the command line arguments:
     * where to find pdf files, where results should be written.
     *
     * <p>Recognised options: {@code -l <logFile>}, {@code -c <dirToTest>},
     * {@code -d} (detailed log) and {@code -h} (usage). With no argument the
     * usage is printed. An option that needs a value but is the last argument
     * prints the usage instead of throwing
     * {@link ArrayIndexOutOfBoundsException}. The value of {@code -l} or
     * {@code -c} is consumed and never re-read as an option.
     *
     * @param args the command line arguments
     */
    public void readargs(String[] args) {
        if (args.length == 0) {
            printUsage();
            return;
        }
        for (int i = 0; i < args.length; i++) {
            String option = args[i];
            if (option.equals("-l") || option.equals("-c")) {
                if (i + 1 >= args.length) {
                    System.out.println("***** Missing value after option " + option);
                    printUsage();
                    break;
                }
                // Consume the value so it is not parsed as an option next turn.
                String value = args[++i];
                if (option.equals("-l")) {
                    Log.loglocation = value;
                } else {
                    testpath = value;
                }
            } else if (option.equals("-d")) {
                savedetaillog = true;
            } else if (option.equals("-h")) {
                printUsage();
            }
        }
    }

    /**
     * Prints the usage (-h).
     */
    private static void printUsage() {
        System.out.println("***** Scigen & Co Checker \n");
        System.out.println("To test all files in a directory <pathToFilesDirToTest>:");
        System.out.println("java -jar ScigenChecker_local.jar -l <pathToLogFile> -c <pathToFilesDirToTest> \n");
        System.out.println("To print usage:");
        System.out.println("java -jar ScigenChecker_local.jar -h \n");
        System.out.println("***** \n");
    }

    /**
     * This is the standalone checker. All pdf files in the dir specified after -c are
     * checked against classes found in the dir "data". Results are written in the log
     * file specified by the -l option. If -d is given a detailed log is produced.
     * Example: testing all pdf files in a directory MyConf/PDF/ and having results
     * in the MyConf/checklog.txt:
     * java -jar ScigenChecker_local.jar -l MyConf/checklog.txt -c MyConf/PDF/
     *
     * @param args the command line arguments
     * @throws java.io.IOException if the config file cannot be read or the
     *         computation reports an I/O error
     */
    public static void main(String[] args) throws IOException {
        Scidetect_Local a = new Scidetect_Local();
        a.readconfig();
        a.readargs(args);
        a.compute();
    }
}
src/fr/imag/forge/scidetect/SciDetect_local/ScigenChecker_Local.java~
deleted
100644 → 0
View file @
03da7eb9
/*
 * Copyright (C) 2015 UNIVERSITE JOSEPH FOURIER (Grenoble 1)/ Springer-Verlag GmbH
 * author Nguyen Minh Tien - minh-tien.nguyen@imag.fr
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 */
package
fr
.
imag
.
Scidetect
.
scigenchecker_local
;
import
fr
.
imag
.
Scidetect
.
Checker
.
Classifier
;
import
fr
.
imag
.
Scidetect
.
Checker
.
DistantCalculator
;
import
fr
.
imag
.
Scidetect
.
Checker
.
Indexer
;
import
fr
.
imag
.
Scidetect
.
Checker
.
Reader
;
import
fr
.
imag
.
Scidetect
.
Logger
.
Log
;
import
fr
.
imag
.
Scidetect
.
TextExtractor
.
pdfextractor
;
import
java
.
io
.
BufferedReader
;
import
java
.
io
.
File
;
import
java
.
io
.
FileNotFoundException
;
import
java
.
io
.
FileReader
;
import
java
.
io
.
IOException
;
import
java
.
io
.
PrintWriter
;
import
java
.
text
.
DateFormat
;
import
java
.
text
.
SimpleDateFormat
;
import
java
.
util
.
Arrays
;
import
java
.
util
.
Date
;
import
java
.
util
.
HashMap
;
/**
*
*
@
author
tien
*/
public
class
ScigenChecker_Local
{
//
private
String
loglocation
;
//
private
String
detailloglocation
;
private
String
testpath
;
//
private
String
logtime
;
private
HashMap
<
String
,
HashMap
<
String
,
Integer
>>
samples
=
new
HashMap
<
String
,
HashMap
<
String
,
Integer
>>();
private
HashMap
<
String
,
HashMap
<
String
,
Integer
>>
tests
=
new
HashMap
<
String
,
HashMap
<
String
,
Integer
>>();
private
String
SamplesFolder
;
private
HashMap
<
String
,
HashMap
<
String
,
Double
>>
distant
=
new
HashMap
<
String
,
HashMap
<
String
,
Double
>>();
private
Boolean
savedetaillog
=
false
;
/**
*
Read
in
the
config
file
:
*-
places
where
to
find
samples
of
each
class
*-
default
places
where
to
write
results
.
*
@
throws
FileNotFoundException
*
@
throws
IOException
*/
private
void
readconfig
()
throws
FileNotFoundException
,
IOException
{
File
conf
=
new
File
(
"config.txt"
);
BufferedReader
br
=
new
BufferedReader
(
new
FileReader
(
conf
));
String
line
;
while
((
line
=
br
.
readLine
())
!= null) {
if
(
!line.startsWith("#")) {
//
System
.
out
.
println
(
line
);
String
[]
b
=
line
.
split
(
"
\t
"
);
if
(
b
[
0
].
equals
(
"samples"
))
{
SamplesFolder
=
b
[
1
];
}
if
(
b
[
0
].
equals
(
"Default_log_folder"
))
{
Log
.
loglocation
=
b
[
1
];
//
System
.
out
.
println
(
loglocation
);
}
if
(
b
[
0
].
equals
(
"Default_detail_log_folder"
))
{
Log
.
detailloglocation
=
b
[
1
];
//
System
.
out
.
println
(
detailloglocation
);
}
}
}
}
/**
*
@
throws
IOException
*/
private
void
compute
()
throws
IOException
{
if
(
testpath
!= null) {
DateFormat
dateFormat
=
new
SimpleDateFormat
(
"HH:mm dd.MM.yyyy"
);
Date
date
=
new
Date
();
Log
.
logtime
=
dateFormat
.
format
(
date
);
try
{
Reader
reader
=
new
Reader
();
reader
.
readconfig
();
samples
=
reader
.
readsamples
(
SamplesFolder
);
tests
=
reader
.
readtests
(
testpath
);
}
catch
(
Exception
e
)
{
System
.
out
.
println
(
"* Something went wrong during:"
);
System
.
out
.
println
(
" - reading the config file"
);
System
.
out
.
println
(
" - reading the samples (dir data)"
);
System
.
out
.
println
(
" - txt extraction from pdf"
);
System
.
out
.
println
(
"* Continuing anyway..."
);
//
e
.
printStackTrace
();
}
DistantCalculator
dc
=
new
DistantCalculator
();
distant
=
dc
.
caldistant
(
samples
,
tests
);
Classifier
cl
=
new
Classifier
();
String
conclusion
=
cl
.
classify
(
distant
);
System
.
out
.
println
(
conclusion
);
Log
log
=
new
Log
();
log
.
savelog
(
conclusion
);
if
(
savedetaillog
)
{
log
.
savedetaillog
(
distant
);
}
}
else
{
System
.
out
.
println
(
"***** Can not read path to the folder:"
+
testpath
);
System
.
out
.
println
(
"***** The folder should contains file to check"
);
}
}
/**
*
Parsing
of
the
command
line
arguments
:
*
where
to
find
pdf
files
,
where
results
should
be
written
*
@
param
args
*/
public
void
readargs
(
String
[]
args
)
{
if
(
args
.
length
>
0
)
{
for
(
int
i
=
0
;
i
<
args
.
length
;
i
+=
1
)
{
//
System
.
out
.
println
(
args
[
i
]);
if
(
args
[
i
].
equals
(
"-l"
))
{
Log
.
loglocation
=
args
[
i
+
1
];
}
if
(
args
[
i
].
equals
(
"-c"
))
{
testpath
=
args
[
i
+
1
];
}
if
(
args
[
i
].
equals
(
"-d"
))
{
savedetaillog
=
true
;
}
if
(
args
[
i
].
equals
(
"-h"
))
{
printUsage
();
}
}
}
else
{
printUsage
();}
}
/**
*
To
print
usage
(-
h
)
*/
private
static
void
printUsage
()
{
System
.
out
.
println
(
"***** Scigen & Co Checker
\n
"
);
System
.
out
.
println
(
"To test all files in a directory <pathToFilesDirToTest>:"
);
System
.
out
.
println
(
"java -jar ScigenChecker_local.jar -l <pathToLogFile> -c <pathToFilesDirToTest>
\n
"
);
System
.
out
.
println
(
"To print usage:"
);
System
.
out
.
println
(
"java -jar ScigenChecker_local.jar -h
\n
"
);
System
.
out
.
println
(
"*****
\n
"
);
}
/**
*
This
is
the
standalone
checker
.
All
pdf
files
in
the
dir
specified
after
-
c
are
*
checked
against
classes
found
in
the
dir
"data"
.
Results
are
written
in
the
log
*
file
specified
by
the
-
l
option
.
If
-
d
is
given
a
detailled
log
is
produced
.
*
Example
:
testing
all
pdf
files
in
a
directory
MyConf
/
PDF
/
and
having
results
*
in
the
MyConf
/
checklog
.
txt
:
*
java
-
jar
ScigenChecker_local
.
jar
-
l
MyConf
/
checklog
.
txt
-
c
MyConf
/
PDF
/
*
@
param
args
the
command
line
arguments
*/
public
static
void
main
(
String
[]
args
)
throws
IOException
{
ScigenChecker_Local
a
=
new
ScigenChecker_Local
();
a
.
readconfig
();
a
.
readargs
(
args
);
a
.
compute
();
}
}
src/fr/imag/forge/scidetect/scigenchecker_local/ScigenChecker_Local.java
deleted
100644 → 0
View file @
03da7eb9
/*
* Copyright (C) 2015 UNIVERSITE JOSEPH FOURIER (Grenoble 1)/ Springer-Verlag GmbH
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
package
fr.imag.forge.scidetect.scigenchecker_local
;
import
fr.imag.forge.scidetect.Checker.Classifier
;
import
fr.imag.forge.scidetect.Checker.DistantCalculator
;
import
fr.imag.forge.scidetect.Checker.Reader
;
import
fr.imag.forge.scidetect.Checker.Utils.DistancesSet
;
import
fr.imag.forge.scidetect.Logger.Log
;
import
fr.imag.forge.scidetect.Corpus.Corpus
;
import
java.io.BufferedReader
;
import
java.io.File
;
import
java.io.FileNotFoundException
;
import
java.io.FileReader
;
import
java.io.IOException
;
import
java.text.DateFormat
;
import
java.text.SimpleDateFormat
;
import
java.util.Date
;
/**
 * Standalone command-line entry point of the checker.
 *
 * <p>The run has three phases, driven by {@link #main(String[])}: defaults are
 * read from {@code config.txt}, command-line options override them, and the
 * files to test are then compared against the samples, classified and logged.
 *
 * @author Nguyen Minh Tien - minh-tien.nguyen@imag.fr
 */
public class ScigenChecker_Local {

    /** Configuration file name, resolved against the current working directory. */
    private static final String CONFIG_FILE = "config.txt";

    /** Folder containing the files to check; set by the {@code -c} option. */
    private String testpath;

    /** Corpus built from the sample folder. */
    private Corpus samples = new Corpus();

    /** Corpus built from the files found under {@link #testpath}. */
    private Corpus tests = new Corpus();

    /** Sample folder, taken from the {@code samples} entry of the config file. */
    private String SamplesFolder;

    /** Distances computed between the samples and the tested files. */
    DistancesSet distant = new DistancesSet();

    /** Whether a detailed log must also be written; set by the {@code -d} option. */
    private boolean savedetaillog = false;

    /**
     * Reads the config file:
     * - places where to find samples of each class
     * - default places where to write results.
     *
     * <p>Each useful line is {@code key<TAB>value}. Lines starting with
     * {@code #} are comments. Lines without a value are skipped instead of
     * failing with an {@link ArrayIndexOutOfBoundsException}.
     *
     * @throws FileNotFoundException if {@code config.txt} cannot be opened
     * @throws IOException if reading the file fails
     */
    private void readconfig() throws FileNotFoundException, IOException {
        BufferedReader br = new BufferedReader(new FileReader(new File(CONFIG_FILE)));
        try {
            String line;
            while ((line = br.readLine()) != null) {
                if (line.startsWith("#")) {
                    continue;
                }
                String[] b = line.split("\t");
                if (b.length < 2) {
                    // Blank line or key without a value: split() also drops a
                    // trailing empty field, so there is nothing to store.
                    continue;
                }
                if (b[0].equals("samples")) {
                    SamplesFolder = b[1];
                } else if (b[0].equals("Default_log_folder")) {
                    Log.loglocation = b[1];
                } else if (b[0].equals("Default_detail_log_folder")) {
                    Log.detailloglocation = b[1];
                }
            }
        } finally {
            // Always release the file handle, even when readLine() throws.
            br.close();
        }
    }

    /**
     * Runs the check: reads samples and tests, computes the distances,
     * classifies them, prints the conclusion and saves it to the log.
     *
     * <p>Nothing is computed when no test folder was given; a hint is printed
     * instead. A failure while reading is reported on standard output and the
     * run deliberately continues with whatever corpora are available.
     *
     * @throws IOException if a call outside the guarded read phase reports an
     *         I/O error
     */
    private void compute() throws IOException {
        if (testpath == null) {
            System.out.println("***** Can not read path to the folder:" + testpath);
            System.out.println("***** The folder should contains file to check");
            return;
        }

        // Time stamp shared with the logger for this run.
        DateFormat dateFormat = new SimpleDateFormat("HH:mm dd.MM.yyyy");
        Log.logtime = dateFormat.format(new Date());

        try {
            Reader reader = new Reader();
            reader.readconfig();
            samples = reader.readsamples(SamplesFolder);
            tests = reader.readtests(testpath);
        } catch (Exception e) {
            // Best effort by design: report the failure and keep going.
            System.out.println("* Something went wrong during:");
            System.out.println(" - reading the config file");
            System.out.println(" - or reading the samples (dir data)");
            System.out.println(" - or txt extraction from pdf");
            System.out.println("* Continuing anyway...");
        }

        DistantCalculator dc = new DistantCalculator();
        distant = dc.caldistant(samples, tests);

        Classifier cl = new Classifier();
        String conclusion = cl.classify(distant);
        System.out.println(conclusion);

        Log log = new Log();
        log.savelog(conclusion);
        if (savedetaillog) {
            log.savedetaillog(distant);
        }
    }

    /**
     * Parses the command line arguments:
     * where to find pdf files, where results should be written.
     *
     * <p>Recognised options: {@code -l <logFile>}, {@code -c <dirToTest>},
     * {@code -d} (detailed log) and {@code -h} (usage). With no argument the
     * usage is printed. An option that needs a value but is the last argument
     * prints the usage instead of throwing
     * {@link ArrayIndexOutOfBoundsException}. The value of {@code -l} or
     * {@code -c} is consumed and never re-read as an option.
     *
     * @param args the command line arguments
     */
    public void readargs(String[] args) {
        if (args.length == 0) {
            printUsage();
            return;
        }
        for (int i = 0; i < args.length; i++) {
            String option = args[i];
            if (option.equals("-l") || option.equals("-c")) {
                if (i + 1 >= args.length) {
                    System.out.println("***** Missing value after option " + option);
                    printUsage();
                    break;
                }
                // Consume the value so it is not parsed as an option next turn.
                String value = args[++i];
                if (option.equals("-l")) {
                    Log.loglocation = value;
                } else {
                    testpath = value;
                }
            } else if (option.equals("-d")) {
                savedetaillog = true;
            } else if (option.equals("-h")) {
                printUsage();
            }
        }
    }

    /**
     * Prints the usage (-h).
     */
    private static void printUsage() {
        System.out.println("***** Scigen & Co Checker \n");
        System.out.println("To test all files in a directory <pathToFilesDirToTest>:");
        System.out.println("java -jar ScigenChecker_local.jar -l <pathToLogFile> -c <pathToFilesDirToTest> \n");
        System.out.println("To print usage:");
        System.out.println("java -jar ScigenChecker_local.jar -h \n");
        System.out.println("***** \n");
    }

    /**
     * This is the standalone checker. All pdf files in the dir specified after -c are
     * checked against classes found in the dir "data". Results are written in the log
     * file specified by the -l option. If -d is given a detailed log is produced.
     * Example: testing all pdf files in a directory MyConf/PDF/ and having results
     * in the MyConf/checklog.txt:
     * java -jar ScigenChecker_local.jar -l MyConf/checklog.txt -c MyConf/PDF/
     *
     * @param args the command line arguments
     * @throws java.io.IOException if the config file cannot be read or the
     *         computation reports an I/O error
     */
    public static void main(String[] args) throws IOException {
        ScigenChecker_Local a = new ScigenChecker_Local();
        a.readconfig();
        a.readargs(args);
        a.compute();
    }
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment