diff --git "a/Niveau-1/Iramuteq/Construction_Dictionnaires_Nom_Esp\303\250ce.pl" "b/Niveau-1/Iramuteq/Construction_Dictionnaires_Nom_Esp\303\250ce.pl" index b98f19e..30bb668 100755 --- "a/Niveau-1/Iramuteq/Construction_Dictionnaires_Nom_Esp\303\250ce.pl" +++ "b/Niveau-1/Iramuteq/Construction_Dictionnaires_Nom_Esp\303\250ce.pl" @@ -2,10 +2,12 @@ use strict; use warnings; - +use utf8; +use open qw/:std :utf8/; use Getopt::Long; my ($programme) = $0 =~ m|^(?:.*/)?(.+)|; +$programme = decode_utf8($programme); my $input = ""; my $lexique = "lexique.txt"; @@ -63,4 +65,4 @@ print STDERR " -o output : liste des expressions espèces\n"; exit $code; -} \ No newline at end of file +} diff --git "a/Niveau-2/Vieillissement_V1/Iramuteq/Pr\303\251paration_Donn\303\251es_entr\303\251e.pl" "b/Niveau-2/Vieillissement_V1/Iramuteq/Pr\303\251paration_Donn\303\251es_entr\303\251e.pl" index 4b3474f..26cde8a 100644 --- "a/Niveau-2/Vieillissement_V1/Iramuteq/Pr\303\251paration_Donn\303\251es_entr\303\251e.pl" +++ "b/Niveau-2/Vieillissement_V1/Iramuteq/Pr\303\251paration_Donn\303\251es_entr\303\251e.pl" @@ -25,21 +25,26 @@ usage(2) if not $dir or not $source; opendir(DIR, $dir) or die "Couldn't open file, $!"; - my @files = readdir(DIR); - closedir(DIR); - my $size = @files; +my @files = grep {not /^\./} readdir(DIR); +closedir(DIR); +my $size = @files; open(DATA, ">:utf8",$sortie) or -die "Couldn't open file $sortie, $!"; + die "Couldn't open file $sortie, $!"; print METADATA "\"id\",\"sous_corpus\"\n"; -foreach my $file(@files){ - $file =~ /(\pL+)_\d*/; - print DATA "**** *souscorpus_$1\n"; - open(FILE, "<:encoding(UTF-8)", "$dir/$file") or die "Couldn't open file $file, $!"; - my @texte = ; - print DATA @texte; - close(FILE); +foreach my $file (@files){ + if ($file =~ /^(\pL+)_\d*/) + { + print DATA "**** *souscorpus_$1\n"; + open(FILE, "<:encoding(UTF-8)", "$dir/$file") or + die "Couldn't open file $file, $!"; + while() + { + print DATA; + } + close(FILE); + } } close(DATA); @@ -52,4 +57,4 @@ print STDERR "Usage : $programme -d dir -s sortie \n"; exit $code; -} \ No newline at end of file +} diff --git a/Niveau-2/Vieillissement_V2/Iramuteq/Correspondance_Identifient_Istex_NomRevue.pl b/Niveau-2/Vieillissement_V2/Iramuteq/Correspondance_Identifient_Istex_NomRevue.pl index 44affd9..48d4641 100644 --- a/Niveau-2/Vieillissement_V2/Iramuteq/Correspondance_Identifient_Istex_NomRevue.pl +++ b/Niveau-2/Vieillissement_V2/Iramuteq/Correspondance_Identifient_Istex_NomRevue.pl @@ -25,9 +25,9 @@ usage(2) if not $wos or not $info; open(WOS, "<:encoding(UTF-8)", $wos) or -die "Couldn't open file $wos, $!"; + die "Couldn't open file $wos, $!"; open(INFO, ">:encoding(UTF-8)", $info) or -die "Couldn't open file $info, $!"; + die "Couldn't open file $info, $!"; while (my $ligne = ) { diff --git "a/Niveau-2/Vieillissement_V2/Iramuteq/Pr\303\251paration_donn\303\251es_Ira.pl" "b/Niveau-2/Vieillissement_V2/Iramuteq/Pr\303\251paration_donn\303\251es_Ira.pl" index 49e1ce4..8e42d5c 100644 --- "a/Niveau-2/Vieillissement_V2/Iramuteq/Pr\303\251paration_donn\303\251es_Ira.pl" +++ "b/Niveau-2/Vieillissement_V2/Iramuteq/Pr\303\251paration_donn\303\251es_Ira.pl" @@ -10,7 +10,7 @@ my ($programme) = $0 =~ m|^(?:.*/)?(.+)|; $programme = decode_utf8($programme); -my $reportoire = ""; #par exemple "Vv2_new" +my $repertoire = ""; #par exemple "Vv2_new" my $journal = ""; #par exemple "Nom_Du_Revue.txt" my $id = ""; #par exemple "Nom_Du_Article.txt" my $data = ""; #par exemple "Vieillissement_V2_New.txt" @@ -26,38 +26,38 @@ }; $SIG{__WARN__} = sub {warn $_[0];}; -usage(2) if not $reportoire or not $journal or not $id or not $data; +usage(2) if not $repertoire or not $journal or not $id or not $data; +my @a = (); open(REVUE, "<:utf8", $journal) -or die "Couldn't open file $revue, $!"; -my @a = ; - -foreach my $revue (@a){ - chomp($revue); - $revue =~ s/\s/_/g; + or die "Couldn't open file $revue, $!"; +while(my $revue = ) +{ + chomp($revue); + $revue =~ s/\s/_/go; + push(@a, $revue); } +close REVUE; open(ID, "<:utf8", $id) or -die "Couldn't open file $id, $!"; -my @b = ; -foreach my $id (@b){ - chomp($id); -} - + die "Couldn't open file $id, $!"; +chomp(my @b = ); +close ID; open(DATA, ">:encoding(UTF-8)",$data) -or die "Couldn't open file $data, $!"; + or die "Couldn't open file $data, $!"; print DATA "\"revue\",\"id\"\n"; -foreach my $i(0 .. $#a){ - open(FILE, "<:utf8", "$reportoire/$b[$i]") or die "Couldn't open file $b[$i]$!"; +for(my $i = 0 ; $i <= $#a ; $i ++) +{ + open(FILE, "<:utf8", "$repertoire/$b[$i]") or die "Couldn't open file $b[$i]$!"; print DATA "**** *revue_$a[$i] *id_$b[$i]\n"; - my @texte = ; - foreach my $ligne (@texte){ + while(my $ligne = ) + { $ligne =~ s/\*//g; + print DATA $ligne; } - print DATA @texte; close(FILE); } close(DATA); @@ -69,7 +69,7 @@ { my $code = shift; -print STDERR "Usage : $programme -r reportoire -j journal -i id -d data \n"; +print STDERR "Usage : $programme -r repertoire -j journal -i id -d data \n"; exit $code; -} \ No newline at end of file +} diff --git a/Niveau-3/TXM/Extraction_Corps_TEI.pl b/Niveau-3/TXM/Extraction_Corps_TEI.pl index 73b226c..c338de9 100755 --- a/Niveau-3/TXM/Extraction_Corps_TEI.pl +++ b/Niveau-3/TXM/Extraction_Corps_TEI.pl @@ -66,4 +66,4 @@ my $code = shift; print STDERR "Usage: $programme -i input -o output\n"; exit $code; -} \ No newline at end of file +} diff --git a/post_traitement_corpus/rename_file.pl b/post_traitement_corpus/rename_file.pl index 14ef895..e44ee02 100644 --- a/post_traitement_corpus/rename_file.pl +++ b/post_traitement_corpus/rename_file.pl @@ -25,18 +25,18 @@ usage(2) if not $dir or not $source; open(SOURCE, "<:encoding(UTF-8)", $source) -or die "Couldn't open file $source, $!"; + or die "Couldn't open file $source, $!"; -my @sourcefile = ; +chomp(my @sourcefile = ); my $size = @sourcefile; print STDERR $size; close SOURCE; my %correspondance; -for(my $n=0;$n<@sourcefile;$n++){ - chomp($sourcefile[$n]); - $sourcefile[$n] =~ /(\w{40})(\W*?)(\w{11})/; - $correspondance{$1}=$3; +for(my $n=0 ; $n<= $#sourcefile ; $n++ ) +{ + $sourcefile[$n] =~ /(\w{40})\W*?(\w+)/; + $correspondance{$1} = $2; } #print "$_ $correspondance{$_}\n" for (keys %correspondance);#imprimer une table d'hachage @@ -45,16 +45,22 @@ print STDERR $size_cles; opendir(DIR, $dir) or die "Couldn't open the directory $dir, $!"; - my @files = readdir(DIR); - closedir(DIR); +my @files = grep {$_ ne '.' and $_ ne '..'} readdir(DIR); +closedir(DIR); foreach my $file (@files){ my $new = $file; $new =~ s/(\w{40}).txt/$1/; - $new = $correspondance{"$new"}; - $new =~ s/$/.txt/; - rename("$dir/$file","$dir/$new"); - print "$file => $new\n"; + if ($correspondance{"$new"}) + { + $new = $correspondance{"$new"}; + rename("$dir/$file","$dir/$new.txt"); + print "$file => $new.txt\n"; + } + else + { + print "Pas de correspondance pour le fichier $file\n"; + } } exit 0; @@ -67,6 +73,3 @@ exit $code; } - - -