Remove extract_text and extract_doc in favor of extract_sigle

Change-Id: I6577a8f453baab96e684da3b2238a31b4f0175e3

commit: 955b75b80d644d17558b39496d8a8f9eed987505 [log] [tgz]
author: Akron <nils@diewald-online.de> Thu Feb 21 14:28:41 2019 +0100
committer: Akron <nils@diewald-online.de> Thu Feb 21 14:28:41 2019 +0100
tree: 9a64bbaee51db210973a2b698c0e7b817059d650
parent: 31a08cb48604ae8e184cbd218b3b1377b5dbbc18 [diff]
diff --git a/script/korapxml2krill b/script/korapxml2krill
index d53004b..5e5b315 100644
--- a/script/korapxml2krill
+++ b/script/korapxml2krill

@@ -769,9 +769,10 @@
       # TODO: Make this OS independent
       print '... ' . (
 
-        $archive->extract_text(
-          ($prefix ? './' : '') . $_, $output
-        ) ? '' : 'not '
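+        # TODO:
+        #   - The './' prefix formerly prepended when $prefix is set is no longer applied here; confirm extract_sigle handles prefixed archives.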
+        $archive->extract_sigle([$_], $output, $jobs)
+        ? '' : 'not '
       );
       print "extracted.\n";
     };
@@ -1004,7 +1005,7 @@
       # because extraction can be horrible slow!
 
       # Extract from archive
-      if ($archive->extract_text($dirs[$i], $temp)) {
+      if ($archive->extract_sigle([join('/', $corpus, $doc, $text)], $temp, $sequential_extraction ? 1 : $jobs)) {
 
         # Create corpus directory
         my $input = catdir("$temp", $corpus);
@@ -1108,13 +1109,9 @@
 
         print "\n";
 
-        # TODO: Make this OS independent
-        my $path = ($prefix ? './' : '') . $_;
-
         print '... ' . (
-          $archive->extract_doc(
-            $path, $output, $sequential_extraction ? 1 : $jobs
-          ) ? '' : 'not '
+          $archive->extract_sigle([$_], $output, $sequential_extraction ? 1 : $jobs)
+            ? '' : 'not '
         );
         print "extracted.\n";
       }
commit	955b75b80d644d17558b39496d8a8f9eed987505	[log] [tgz]
author	Akron <nils@diewald-online.de>	Thu Feb 21 14:28:41 2019 +0100
committer	Akron <nils@diewald-online.de>	Thu Feb 21 14:28:41 2019 +0100
tree	9a64bbaee51db210973a2b698c0e7b817059d650
parent	31a08cb48604ae8e184cbd218b3b1377b5dbbc18 [diff]