'; // should also allow $string = strip_tags($content,$tags); //echo s($string); $matches = array(); // this will look for a non nested tag that is closed // want to allow (maybe more) tags but when we do that // the preg_match messes up. preg_match_all("/(<([\w]+)[^>]*>)([^<\\2>]*)(<\/\\2>)/", $string, $matches); //(<([\w]+)[^>]*>)([^<\\2>]*)(<\/\\2>) original pattern //(<(div+)[^>]*>)[^() work in progress $path_parts = pathinfo($file); $file = substr($path_parts['basename'], 0, strpos($path_parts['basename'], '.')); // get rid of the extension $imgs = array(); // this preg matches all images preg_match_all("/]*(src\=\"(".$file."\_image[^>^\"]*)\"[^>]*)>/i", $string, $imgs); // start building our page $page = new stdClass; $page->title = ''; $page->contents = array(); $page->images = array(); $page->source = $path_parts['basename']; // need for book only // this foreach keeps the style intact. Found it doesn't help much. But if you want back uncomment // this foreach and uncomment the line with the comment imgstyle in it. Also need to comment out // the $page->images[]... line in the next foreach /*foreach ($imgs[1] as $img) { $page->images[] = ''; }*/ foreach ($imgs[2] as $img) { copy($path_parts['dirname'].'/'.$img, $imagedir.'/'.$img); $page->images[] = " $\"$img\"$ "; // comment out this line if you are using the above foreach loop } for($i = 0; $i < count($matches[1]); $i++) { // go through all of our div matches $class = isolate_class($matches[1][$i]); // first step in isolating the class // check for any static classes switch ($class) { case 'T': // class T is used for Titles $page->title = $matches[3][$i]; break; case 'B': // I would guess that all bullet lists would start with B then go to B1, B2, etc case 'B1': // B1-B4 are just insurance, should just hit B and all be taken care of case 'B2': case 'B3': case 'B4': $page->contents[] = build_list('
', $i, 0); // this is a recursive function that will grab all the bullets and rebuild the list in html break; default: if ($matches[3][$i] != ' ') { // odd crap generated... sigh if (substr($matches[3][$i], 0, 1) == ':') { // check for leading : ... hate MS ... $page->contents[] = substr($matches[3][$i], 1); // get rid of : } else { $page->contents[] = $matches[3][$i]; } } break; } } // add the page to the array; $extratedpages[] = $page; } // end $pages foreach loop return $extratedpages; }

/**
 * Recursively builds an HTML unordered list out of consecutive bullet matches.
 *
 * Works on the global $matches array: $matches[1][$n] is an opening tag and
 * $matches[3][$n] is the text between that tag and its closing tag. Starting
 * at index $i, every match whose class contains "B" is consumed; the first
 * match with any other class ends the list.
 *
 * @param string $list  Markup built so far. This function only appends the
 *                      items and the closing tag, so the opening <ul> of the
 *                      outermost list has to be supplied by the caller.
 * @param int    $i     Index into $matches. Passed by reference and advanced
 *                      past every match that was consumed.
 * @param int    $depth Nesting depth of the list being built: class B is
 *                      depth 0, B1 is depth 1, B2 is depth 2 and so on.
 * @return string The markup with this level's closing </ul> appended.
 */
function build_list($list, &$i, $depth) {
    global $matches;

    $total = count($matches[1]);
    while ($i < $total) {
        $class = isolate_class($matches[1][$i]);

        if (strpos($class, 'B') === false) {
            // not a bullet class, so this list is finished
            break;
        }

        if ($class == 'B') {
            $this_depth = 0;
        } else {
            // the digits after the leading letter are the depth: B1 => 1, B2 => 2
            $this_depth = substr($class, 1);
            if (!is_numeric($this_depth)) {
                print_error('Depth not parsed!');
            }
        }

        if ($this_depth < $depth) {
            // this bullet belongs to an outer list; let the caller handle it
            break;
        }

        if ($this_depth > $depth) {
            // deeper bullet: open a nested list and let the recursion fill and
            // close it. $i has been advanced when the call returns, so
            // re-examine whatever it now points at.
            $list .= '<ul>';
            $list = build_list($list, $i, $this_depth);
            continue;
        }

        // same depth: add the bullet, skipping the ones that clean down to nothing.
        // Compared explicitly so that a bullet whose text is "0" is not dropped.
        $text = ppt_clean_text($matches[3][$i]);
        if ($text !== false && $text !== '') {
            $list .= '<li>'.$text.'</li>';
        }
        $i++;
    }

    // end the list and return it
    $list .= '</ul>';
    return $list;
}

/**
 * Extracts the value of the class attribute from an HTML opening tag.
 *
 * The value is everything after "class=" up to the first space (further
 * attributes follow) or the closing ">" (class was the last attribute).
 * Surrounding quotes, if any, are not removed.
 *
 * @param string $string An opening tag, e.g. <div class=B1 style=...>.
 * @return string The class value, or '' when the tag has no class attribute.
 */
function isolate_class($string) {
    $attribute = strstr($string, 'class=');
    if ($attribute === false) {
        // no class defined in the tag
        return '';
    }

    // drop the "class=" prefix, then cut at whichever terminator comes first
    $value = substr($attribute, strlen('class='));
    return substr($value, 0, strcspn($value, ' >'));
}

/**
 * Strips the stray characters that PowerPoint puts in front of bullet text.
 *
 * By default a single leading character is removed. When the text starts with
 * the entity &lt; the whole four-character entity is removed instead.
 *
 * NOTE(review): the entity literals below (&lt; and &#13;) were restored from a
 * copy of this file in which HTML entities had been decoded; the chop length of
 * 4 matches &lt;, but confirm both literals against the upstream file.
 *
 * @param string $string Raw bullet text.
 * @return string|false The cleaned text, or false when all that is left is a
 *                      carriage-return entity (or nothing could be extracted).
 */
function ppt_clean_text($string) {
    // default: just a single char in front of the content
    $chop = 1;

    // a leading &lt; entity is four characters long
    if (strpos($string, '&lt;') === 0) {
        $chop = 4;
    }
    // may need to add more later....

    $string = substr($string, $chop);

    if ($string != '&#13;') {
        return $string;
    }
    return false;
}

/**
 * Placeholder for cleaning up the temp directory; currently does nothing.
 *
 * TODO: this was disabled because it was broken. It should only remove what
 * this import created, since someone else could be importing a ppt at the same
 * time. The disabled call was:
 *     delDirContents($CFG->dataroot.'/temp/lesson');
 */
function clean_temp() {
}

/**
 * Creates the chapter objects that are to be inserted into the database.
 *
 * Every page object becomes one chapter. Page numbers continue after the
 * chapters the book already has.
 *
 * @param array $pageobjects Page objects with title, contents, images and
 *                           source properties.
 * @param int   $bookid      Id of the book the chapters belong to.
 * @return array One stdClass chapter per page object, in the same order.
 */
function book_create_objects($pageobjects, $bookid) {
    global $DB;

    $chapters = array();

    // values that are the same for all chapters
    $now = time();
    $template = new stdClass;
    $template->bookid = $bookid;
    $template->timecreated = $now;
    $template->timemodified = $now;
    $template->subchapter = 0;

    $pagenum = $DB->count_records('book_chapters', array('bookid' => $bookid)) + 1;
    $i = 1;

    foreach ($pageobjects as $pageobject) {
        $page = prep_page($pageobject, $i);  // get title and contents

        // Objects are assigned by handle, so every chapter needs its own copy;
        // otherwise all array entries would point at one and the same object.
        $chapter = clone $template;
        $chapter->pagenum = $pagenum;
        $chapter->importsrc = addslashes($pageobject->source); // add the source
        $chapter->title = $page->title;
        $chapter->content = $page->contents;
        $chapters[] = $chapter;

        // increment our page number and our counter
        $pagenum++;
        $i++;
    }

    return $chapters;
}

/**
 * Builds the title and content strings from a page object.
 *
 * The content string is all images first, followed by every content element
 * wrapped in <p> tags. Line breaks are stripped from both.
 *
 * NOTE(review): the values are passed through addslashes(). If they end up in
 * the database through $DB with bound parameters this double-escapes them;
 * confirm whether any caller still needs the escaping before removing it.
 *
 * @param stdClass $pageobject Object with title (string), images (array of
 *                             strings) and contents (array of strings).
 * @param int      $count      Position of the page, used for the generic title.
 * @return stdClass Object with the properties title and contents (strings).
 */
function prep_page($pageobject, $count) {
    $page = new stdClass;

    if ($pageobject->title == '') {
        $page->title = "Page $count";  // no title set so make a generic one
    } else {
        $page->title = addslashes($pageobject->title);
    }

    $page->contents = '';

    // nab all the images first
    foreach ($pageobject->images as $image) {
        $image = str_replace(array("\n", "\r"), '', $image);
        $image = str_replace("'", '"', $image);  // imgstyle
        $page->contents .= addslashes($image);
    }

    // wrap every content element in <p> tags and strip out line breaks, which
    // have been found to be unnecessary.
    // NOTE(review): '&#13;' (carriage-return entity) was restored from a copy
    // of this file with decoded entities, where it read as a plain space and
    // therefore deleted every space in the text; confirm against upstream.
    foreach ($pageobject->contents as $content) {
        $content = str_replace(array("\n", "\r", '&#13;'), '', $content);
        $page->contents .= addslashes('<p>'.$content.'</p>');
    }

    return $page;
}

/**
 * Saves the chapter objects to the database.
 *
 * Chapters are inserted one by one in array order; the new record id is stored
 * in the id property of each chapter.
 *
 * @param array  $chapters Chapter objects to insert into book_chapters.
 * @param int    $bookid   Not used by this function.
 * @param string $pageid   Not used by this function.
 * @return bool Always true; a failed insert is reported through print_error().
 */
function book_save_objects($chapters, $bookid, $pageid='0') {
    global $DB;

    // nothing fancy, just save them all in order
    foreach ($chapters as $chapter) {
        $chapter->id = $DB->insert_record('book_chapters', $chapter);
        if (!$chapter->id) {
            print_error('Could not update your book');
        }
    }

    return true;
}

"; print_string("upload"); echo ":	"; echo ""; echo "
	"; echo ""; echo "