#!/usr/bin/perl require '/mit/mkgray/perl/dateparse.pl'; require 'ctime.pl'; %colormap = ("Matthew", "#aaaaff", "Nelson", "#ffaaaa", "Oliver", "#aaffaa", "Raffi", "#ffccaa"); @prword = ("No importance", "very low", "low", "medium", "high", "urgent"); @szword = ("Null", "tiny", "small", "medium", "big", "huge"); # A task looks something like this: # # # Do this and that blah blah blah # I can help you if you need it --nelson # # Load up a list of tasks from an XML file into # @tasks, which is an array of Task's if($ARGV[0] eq "-genhtml"){ shift; $slash = $/; undef $/; $f = (<>); $/ = $slash; &parse($f); &printhtml(); exit; } else { require '/home/httpd/cgi-bin/parseform.pl'; $xmlfile = "/home/httpd/xml-todo"; if($ENV{'REQUEST_METHOD'} eq "POST"){ $post = 1; read(STDIN, $q, $ENV{'CONTENT_LENGTH'}); } else{ $post = 0; $q = $ENV{'QUERY_STRING'}; } %form = &parseform($q); $pi = $ENV{'PATH_INFO'}; undef $/; open(F, $xmlfile); $f = (); &parse($f); if($pi ne ""){ if(!flock(F, 2)){ # D'oh, file locked print "Content-type: text/html\n\n"; print "File locked, try again\n"; exit; } } #------------------------------------------------------ if($pi eq "/addtask"){ $nt = new Task($form{Person}, $form{Priority}, $form{Size}, time(), -1, $form{Description}); push(@tasks, $nt); &writexml(); print "Location: /hive-todo.cgi\n\n"; } #------------------------------------------------------ elsif($pi eq "/xml"){ print "Content-type: text/html\n\n"; print "

\n"; print "

\n"; } #------------------------------------------------------ elsif($pi eq "/xml-edit"){ open(XML, ">$xmlfile"); print XML $form{'xml'}; close(XML); @tasks = (); undef $/; open(F, $xmlfile); $f = (); &parse($f); &writexml(); print "Location: /hive-todo.cgi\n\n"; } #------------------------------------------------------ elsif($pi eq "/done"){ for $t (@tasks){ if($form{'withdesc'} eq $t->{description}){ $t->{completed} = time(); } } &writexml(); print "Location: /hive-todo.cgi\n\n"; } #------------------------------------------------------ else{ print "Content-type: text/html\n\n"; &printhtml(); } } flock(XML, 8); sub writexml { open(XML, ">$xmlfile"); my($t); for $t (@tasks){ print XML $t->toXML(); print XML "\n"; } close(XML); } sub printhtml { print "\n"; print "

Hive To Do List

\n"; print "

To do

"; print "\n"; print ""; for $t (@tasks){ $t->toHTML() if ($t->{completed} < 0); } print "

Person	Priority 1 = least important 5 = most important	Size	Description/comments	Entered	Finished!

\n"; print "

Finished

"; print "\n"; print ""; for $t (@tasks){ $t->toHTML() if ($t->{completed} >= 0); } print "

Person	Priority 1 = least important 5 = most important	Size	Description/comments	Entered	Completed

\n"; print "

[Add a task] [View XML] [Reload list]\n"; } sub characters { my($c) = @_; $charbuf .= $c; } sub element { my($el, $close, %attrs) = @_; if($intask){ if($indesc){ # If it's a close description tag, we're done if((lc($el) eq "description") && ($close)){ $description = $charbuf; $charbuf = ""; $indesc = 0; } # otherwise, put it in the charbuf else{ &dumpinbuf($el, $close, %attrs); } } elsif($incomment){ # If it's a close comment tag, store it away if((lc($el) eq "comment") && ($close)){ $curtask->addComment($charbuf, &pgetdate(&clean($commenttime))); push(@comments, $c); $incomment = 0; } # otherwise, put it in the charbuf else { &dumpinbuf($el, $close, %attrs); } } elsif(lc($el) eq "comment"){ if($close){ # Shouldn't be here, we'll dump it in the buffer &dumpinbuf($el, $close, %attrs); } else{ $charbuf = ""; $commenttime = $attrs{"added"}; $incomment = 1; } } elsif(lc($el) eq "description"){ if($close){ # Bad &dumpinbuf($el, $close, %attrs); } else { $charbuf = ""; $indesc = 1; } } elsif(lc($el) eq "task"){ if($close){ $curtask->{description} = $description; $description = ""; push(@tasks, $curtask); $intask = 0; } else{ # A subtask # Not yet handled &dumpinbuf($el, $close, %attrs); } } } elsif(lc($el) eq "task"){ $comptime = &pgetdate(&clean($attrs{"completed"})); $comptime += (5*60*60) if($comptime > 0); $curtask = new Task(&clean($attrs{"person"}), &clean($attrs{"priority"}), &clean($attrs{"size"}), (60*60*5)+&pgetdate(&clean($attrs{"added"})), $comptime, $description); $intask = 1; } } sub dumpinbuf { my($el, $close, %attrs) = @_; $cslash = ($close) ? "/":""; $charbuf .= "<$cslash$el "; for $k (keys %attrs){ $charbuf .= "$k = \"$attrs{$k}\" "; } chop($charbuf); $charbuf .= ">"; } sub clean { $str = shift; if($str =~ /^\".+\"$/){ chop $str; $str =substr($str, 1); } $str; } sub myctime { my($t) = @_; my($time) = &ctime($t); chop($time); $time; } #------------------------------------------------------------ # XML Parsing stuff #------------------------------------------------------------ sub parse { my($file) = @_; while ($file =~ /([^<]*)<(\/)?([^>]+)>/) { $st_or_et = $2; $gi = $3; $file = $'; $pretext = $1; # I recognize the following kinds of objects: XML declaration # (a particular type of processing instruction), processing # instructions, comments, doctype declaration, cdata marked # sections, and elements. Since the document production has # order rules I set a flag when a particlar type of object # has been processed. I invoke a subroutine to process each # type of object. if ($gi =~ /^\?XML/) { &process_decl; $decl_seen = 1; } elsif ($gi =~ /^\?/) { &process_pi; $misc_seen = 1; } elsif ($gi =~ /^!\-\-/) { &process_comment; $misc_seen; } elsif ($gi =~ /^!DOCTYPE/) { &process_doctype; $doctype_seen = 1; } elsif ($gi =~ /^\!\[CDATA\[/) { &process_cdata; } else { &process_element; $element_seen = 1; } } } #--------------------------------------------------------------------------# sub check_error_count { if ($error_count == 0) { print "This document appears to be well-formed.\n"; } } #--------------------------------------------------------------------------# # Check to see if the ancestor stack containing all parents up to the # root is empty. sub check_empty_stack { if ($#ancestors > -1) { &print_error_at_context; } } #--------------------------------------------------------------------------# # Check to see if there is any uncontained PCDATA lying around (white space # at the end of the document doesn't count). I check also to see that # a root to the document was found which catches a null file error. sub check_uncontained_pcdata { if ($file !~ /^\s*$/ || $ROOT eq "") { $error_count++; print "\nNot well formed uncontained #PCDATA or null file\n"; } } #--------------------------------------------------------------------------# # Check that the XML declaration is coded properly and in the correct # position (before any other object in the file and occuring only # once.) sub process_decl { if ($decl_seen || $misc_seen || $doctype_seen || $element_seen) { $error_count++; print "XML declaration can only be at the head of the document.\n"; } # No checks are performed on processing instructions but the following # will be used to store the PI in the $gi variable and advance the # file pointer. &process_pi; # This is slightly lazy since we allow version='1.0". It is quite simple # to fix just by making an OR of each parameter with either ' ' or " " # quote marks. if ($gi !~/\?XML\s+version=[\'\"]1.0[\'\"](\s+encoding=[\'\"][^\'\"]*[\'\"])? (\s+RMD=[\'\"](NONE|INTERNAL|ALL)[\'\"])?\s*\?/) { $error_count++; print "Format of XML declaration is wrong.\n"; } } #--------------------------------------------------------------------------# # Check that the Doctype statement is in the right position and, otherwise, # make no attempt to parse its contents, including the root element. The # root element will determined from the element production itself and # the "claim" of the Doctype won't be verified. sub process_doctype { if ($doctype_seen || $element_seen) { $error_count++; print "Doctype can only appear once and must be within prolog.\n"; } if ($gi =~ /\[/ && $gi !~ /\]$/) { $file =~ /\]>/; $file = $'; $gi = $gi.$`.$&; } } #--------------------------------------------------------------------------# # Performs the well-formed check necessary to verify that CDATA is not # nested. We will pick up the wrong end of CDATA marker if this is the # case so the error message is critical. sub process_cdata { if ($gi !~ /\]\]$/) { $file =~ /\]\]>/; $file = $'; $gi = $gi.$`."]]"; } $gi =~ /\!\[CDATA\[(.*)\]\]/; $body = $1; if ($body =~ /<\!\[CDATA\[/) { print "Nested CDATA.\n"; &print_error_at_context; } } #--------------------------------------------------------------------------# # Performs the well-formed check of ensuring that '--' is not nested # in the comment body which would cause problems for SGML processors. sub process_comment { if ($gi !~ /\-\-$/) { $file =~ /\-\->/; $file = $'; $gi = $gi.$`."--"; } $gi =~ /\!\-\-((.|\n)*)\-\-/; $body = $1; if ($body =~ /\-\-/) { $error_count++; print "Comment contains --.\n"; } } #--------------------------------------------------------------------------# # This is the main subroutine which handles the ancestor stack (in an # array) checking the proper nesting of the element part of the document # production. sub process_element { &characters($pretext); # Distinguish between empty elements which do not add a parent to the # ancestor stack and elements which can have content. if ($gi =~ /\/$/) { $xml_empty = 1; $gi =~ s/\/$//; # XML well-formedness says every document must have a container so an # empty element cannot be the root, even if it is the only element in # the document. if (!$element_seen) { print "Empty element <$gi/> cannot be the root.\n"; } } else { $xml_empty = 0; } # Check to see that attributes are well-formed. my(%attrs) = (); if ($gi =~ /\s/) { $gi = $`; $attrline = $'; $attrs = $attrline; # This time we properly check to see that either ' ' or " " is # used to surround the attribute values. while ($attrs =~ /\s*([^\s=]*)\s*=\s*(("[^"]*")|('[^']*'))/) { # An end tag may not, of course, have attributes. $attrs{$1} = $2; if ($st_or_et eq "\/") { print "Attributes may not be placed on end tags.\n"; &print_error_at_context; } $attrname = $1; # Check for a valid attribute name. &check_name($attrname); $attrs = $'; } $attrs =~ s/\s//g; # The above regex should have processed all the attributes. If anything # is left after getting rid of white space it is because the attribute # expressesion was malformed. if ($attrs ne "") { print "Malformed attributes.\n"; &print_error_at_context; } } # If XML is declared case-sensitive the following line should be # removed. At the moment it isn't so I set everything to lower # case so we can match start and end tags irrespective of case # differences. $gi =~ tr/A-Z/a-z/; if (!$element_seen) { $ROOT = $gi; } # Check to see that the generic identifier is a well-formed name. &check_name($gi); # If I have an end tag I just check the top of the stack, the # end tag must match the last parent or it is an error. If I # find an error I have I could either pop or not pop the stack. # What I want is to perform some manner of error recovery so # I can continue to report well-formed errors on the rest of # the document. If I pop the stack and my problem was caused # by a missing end tag I will end up reporting errors on every # tag thereafter. If I don't pop the stack and the problem # was caused by a misspelled end tag name I will also report # errors on every following tag. I happened to chose the latter. if ($st_or_et eq "\/") { $parent = $ancestors[$#ancestors]; if ($parent ne $gi) { if (@ancestors eq $ROOT) { @ancestors = ""; } else { &print_error_at_context; } } else { pop @ancestors; } &element($gi, 1, %attrs); } else { # This is either an empty tag or a start tag. In the latter case # push the generic identifier onto the ancestor stack. &element($gi, 0, %attrs); if (!$xml_empty) { push (@ancestors, $gi); } } } #--------------------------------------------------------------------------# # Skip over processing instructions. sub process_pi { if ($gi !~ /\?$/) { $file =~ /\?>/; $gi = $gi.$`."?"; $file = $'; } } #--------------------------------------------------------------------------# sub print_error_at_context { # This routine prints out an error message with the contents of the # ancestor stack so the context of the error can be identified. # It would be most helpful to have line numbers. In principle it # is possible but more difficult since we choose to not process the # document line by line. We could still count line break characters # as we scan the document. # Nesting errors can cause every tag thereafter to generate an error # so stop at 10. if ($error_count == 10) { print "More than 10 errors ...\n"; $error_count++; } else { $error_count++; print "Not well formed at context "; # Just cycle through the ancestor stack. foreach $element (@ancestors) { print "$first$element"; $first = "->"; } $first = ""; print " tag: <$st_or_et$gi $attrline>\n"; } } #--------------------------------------------------------------------------# # Check for a well-formed Name as defined in the Name production. sub check_name { local($name) = @_; if ($name !~ /^[A-Za-z_:][\w\.\-:]*$/) { print "Invalid element or attribute name: $name\n"; &print_error_at_context; } } #--------------------- package Task; sub new { my($this, $person, $priority, $size, $added, $completed, $description) = @_; return bless { 'person' => $person, 'priority' => $priority, 'size' => $size, 'added' => $added, 'completed' => $completed, 'description' => $description, 'comments' => [] }; } sub print { $this = @_; print "___Task___\n"; print $this->{description}."\n\t"; print "p/p/s ".$this->{person}." ".$this->{priority}." ".$this->{size}."\n\t"; print "a/c ".$this->{added}." ".$this->{completed}."\n\t"; } sub toHTML { my($this) = @_; $personcolor = "white"; $personcolor = $main::colormap{$this->{person}} if $main::colormap{$this->{person}}; print "".$this->{person}."\n".$main::prword[int($this->{priority})]."\n".$main::szword[$this->{size}]."\n"; @comments = @{$this->{comments}}; $comments = ""; for $c (@comments) { $comments .= "

".$c->{comment}."

".&main::myctime($c->{time})."

\n"; } print "".$this->{description}."\n".$comments."\n"; print "".&main::myctime($this->{added})."\n"; if ($this->{completed} > 0){ print "".&main::myctime($this->{completed})."\n"; } else{ $doneqs = &urlescape($this->{description}); print "Done\n"; } print "\n"; } sub urlescape { my($v) = @_; $v =~ s/([^a-zA-Z])/"%".unpack("H2", $1)/eg; $v; } sub toXML { my($this) = @_; my($ret); $ret = "{person}\" "; $ret .= "priority=\"$this->{priority}\"\n"; $ret .= "size=\"$this->{size}\" "; $ret .= "added=\"".&main::myctime($this->{added})."\"\n"; if($this->{completed} >= 0){ $ret .= "completed=\"".&main::myctime($this->{completed})."\""; } else{ $ret .= "completed=\"\""; } $ret.= ">\n"; $ret .= "$this->{description}\n"; @comments = @{$this->{comments}}; for $c (@comments) { $ret .= "{time})."\">".$c->{comment}.""; } $ret .= "\n"; $ret; } sub addComment { my($self, $comment, $when) = @_; push(@{$self->{comments}}, Comment->new($comment, $when)); } 1; package Comment; sub new { my($this, $c, $t) = @_; return bless { 'comment' => $c, 'time' => $t }; }