|
|
(4 intermediate revisions by the same user not shown) |
Line 1: |
Line 1: |
− | #!/usr/bin/perl
| + | {{lowercase}}{{svn|tools|osv2wiki.pl}} |
− | # Imports rows from an OpenOffice spreadsheet file (*.ods) into wiki record articles{{perl}}
| |
− | # - processes only the first sheet
| |
− | # - ignores empty rows
| |
− | use strict;
| |
− | require('xml.pl');
| |
− | require('wiki.pl');
| |
| | | |
− | # The details of the wiki to add the records to
| + | '''ods2wiki''' is a way to import data from a Open Office spreadsheet files into a MediaWiki. |
− | my $wiki = 'http://svn.localhost/wiki/index.php';
| |
− | my $user = 'foo';
| |
− | my $pass = 'bar';
| |
| | | |
− | # The name of the record template
| + | [[Category:Tools]][[Category:PERL]] |
− | my $tmpl = 'Activity';
| |
− | | |
− | # Column names and regex to determine rows to extract (case insensitive)
| |
− | my %filter = (
| |
− | 'type' => 'hours'
| |
− | );
| |
− | | |
− | # Names of columns to include from source data and their target template parameter names
| |
− | my @mapcols = (
| |
− | );
| |
− | | |
− | # Additional parameters and default values to add
| |
− | my @addcols = (
| |
− | );
| |
− | | |
− | # Log in to the wiki
| |
− | wikiLogin($::wiki,$::user,$::pass) or exit;
| |
− | | |
− | # Extract the content.xml file from the .ods archive
| |
− | my $xml = $ARGV[0] or die "Please specify a .ods file to import rows from";
| |
− | | |
− | # Convert the XML to a hash tree (see http://www.organicdesign.co.nz/xml.pl)
| |
− | $xml = xmlParse(join('', qx( unzip -p $xml content.xml )));
| |
− | | |
− | # Extract the data from the hash tree and add to the wiki
| |
− | my %cols = ();
| |
− | my $first = 1;
| |
− | for (@{$$xml{-content}}) {
| |
− | for (@{$$_{-content}}) {
| |
− | if ($$_{-name} eq 'office:body') {
| |
− | for (@{$$_{-content}}) {
| |
− | my $done = 0;
| |
− | for (@{$$_{-content}}) {
| |
− |
| |
− | # Only process rows for the first sheet
| |
− | if ($$_{-name} eq 'table:table' && $done == 0) {
| |
− | $done++;
| |
− |
| |
− | # Loop through the rows of this sheet
| |
− | for (@{$$_{-content}}) {
| |
− | my @row = ();
| |
− | for (@{$$_{-content}}) {
| |
− |
| |
− | # Add this cell's content to the row
| |
− | my $cell = '';
| |
− | $cell = $$_{-content}[0] for @{$$_{-content}};
| |
− | push @row, $cell;
| |
− |
| |
− | # Handle the table:number-columns-repeated attribute
| |
− | if (defined $$_{'table:number-columns-repeated'} && $$_{'table:number-columns-repeated'} < 100) {
| |
− | push @row, $cell while --$$_{'table:number-columns-repeated'};
| |
− | }
| |
− | }
| |
− |
| |
− | # Process this row (unless empty)
| |
− | if (join('', @row)) {
| |
− |
| |
− | # Process this data row (or define cols if first row)
| |
− | if ($first) {
| |
− | for (0..$#row) { $cols{lc $row[$_]} = $_ }
| |
− | $first = 0;
| |
− | } else {
| |
− |
| |
− | # Check if it passes through the filter
| |
− | my $fail = 0;
| |
− | while (my ($col, $pat) = each(%filter)) {
| |
− | $fail = 1 unless $row[$cols{lc $col}] =~ /$pat/i;
| |
− | }
| |
− |
| |
− | # Process this row if it passed
| |
− | unless ($fail) {
| |
− | | |
− | # Create record article title
| |
− | | |
− | # Get the current text of the article to be created/updated if any
| |
− | $text = wikiRawPage($wiki, $title, 0);
| |
− | $action = $text ? 'updated' : 'created';
| |
− | | |
− | # Replace, prepend or append the template into the current text
| |
− | for (wikiExamineBraces($text)) { ($pos, $len) = ($_->{OFFSET}, $_->{LENGTH}) if $_->{NAME} eq $tmpl }
| |
− | if (defined $pos) { $text = substr $text, $pos, $len, $tmpl }
| |
− | else { $text = $append ? "$text\n$tmpl" : "$tmpl\n$text" }
| |
− | | |
− | # Update the article
| |
− | $done = wikiEdit(
| |
− | $wiki,
| |
− | $title,
| |
− | $text,
| |
− | "[[Template:$tmpl|$tmpl]] record $action by [[OD:Ods2wiki.pl|ods2wiki.pl]]"
| |
− | );
| |
− |
| |
− | print join("\t", @row)."\n";
| |
− |
| |
− | }
| |
− | }
| |
− | }
| |
− | }
| |
− | }
| |
− | }
| |
− | }
| |
− | }
| |
− | }
| |
− | }
| |