You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
470 lines
17 KiB
470 lines
17 KiB
12 years ago
|
<?php // $Id: importppt.php,v 1.1.2.2 2010/07/24 02:46:16 arborrow Exp $
|
||
|
/**
|
||
|
* This is a very rough importer for powerpoint slides
|
||
|
* Export a powerpoint presentation with powerpoint as html pages
|
||
|
* Do it with office 2002 (I think?) and no special settings
|
||
|
* Then zip the directory with all of the html pages
|
||
|
* and the zip file is what you want to upload
|
||
|
*
|
||
|
* The script supports book and lesson.
|
||
|
*
|
||
|
* @version $Id: importppt.php,v 1.1.2.2 2010/07/24 02:46:16 arborrow Exp $
|
||
|
* @license http://www.gnu.org/copyleft/gpl.html GNU Public License
|
||
|
* @package lesson
|
||
|
**/
|
||
|
|
||
|
require_once("../../config.php");
|
||
|
require_once("locallib.php");
|
||
|
|
||
|
// ---------------------------------------------------------------------------
// Request handling: resolve the course module, check permissions, then either
// process an uploaded zip of exported slides or print the upload form.
// ---------------------------------------------------------------------------

$id     = required_param('id', PARAM_INT);         // Course Module ID
$pageid = optional_param('pageid', '', PARAM_INT); // Page ID
global $matches;

if (! $cm = get_coursemodule_from_id('lesson', $id)) {
    error("Course Module ID was incorrect");
}

if (! $course = get_record("course", "id", $cm->course)) {
    error("Course is misconfigured");
}

// allows for adaption for multiple modules
if(! $modname = get_field('modules', 'name', 'id', $cm->module)) {
    error("Could not find module name");
}

if (! $mod = get_record($modname, "id", $cm->instance)) {
    error("Course module is incorrect");
}

require_login($course->id, false);
$context = get_context_instance(CONTEXT_MODULE, $cm->id);
require_capability('mod/lesson:edit', $context);

$strimportppt = get_string("importppt", "lesson");
$strlessons = get_string("modulenameplural", "lesson");

print_header_simple("$strimportppt", " $strimportppt",
    "<a href=\"index.php?id=$course->id\">$strlessons</a> -> <a href=\"$CFG->wwwroot/mod/$modname/view.php?id=$cm->id\">".format_string($mod->name,true)."</a>-> $strimportppt");

if ($form = data_submitted()) {   /// Filename

    // The three cases are mutually exclusive. Previously a request without a
    // 'newfile' field fell through to the next test, which indexed the missing
    // entry (PHP notices) and printed a second, misleading notification.
    if (empty($_FILES['newfile'])) {
        // the form was posted without any file field
        notify(get_string("uploadproblem") );

    } else if (!is_uploaded_file($_FILES['newfile']['tmp_name']) or $_FILES['newfile']['size'] == 0) {
        // a file field is present but nothing usable was uploaded
        notify(get_string("uploadnofilefound") );

    } else {  // Valid file is found

        if ($rawpages = readdata($_FILES, $course->id, $modname)) {
            // first try to read all of the data in
            $pageobjects = extract_data($rawpages, $course->id, $mod->name, $modname); // parse all the html files into objects
            clean_temp(); // all done with files so dump em

            // module specific hooks: <modname>_create_objects / <modname>_save_objects
            $mod_create_objects = $modname.'_create_objects';
            $mod_save_objects = $modname.'_save_objects';

            $objects = $mod_create_objects($pageobjects, $mod->id); // function to prep the data to be sent to DB

            if(! $mod_save_objects($objects, $mod->id, $pageid)) { // sends it to DB
                error("could not save");
            }
        } else {
            error('could not get data');
        }

        echo "<hr>";
        print_continue("$CFG->wwwroot/mod/$modname/view.php?id=$cm->id");
        print_footer($course);
        exit;
    }
}

/// Print upload form

print_heading_with_help($strimportppt, "importppt", "lesson");

print_simple_box_start("center");
echo "<form id=\"theform\" enctype=\"multipart/form-data\" method=\"post\">";
echo "<input type=\"hidden\" name=\"id\" value=\"$cm->id\" />\n";
echo "<input type=\"hidden\" name=\"pageid\" value=\"$pageid\" />\n";
echo "<table cellpadding=\"5\">";

echo "<tr><td align=\"right\">";
print_string("upload");
echo ":</td><td>";
echo "<input name=\"newfile\" type=\"file\" size=\"50\" />";
echo "</td></tr><tr><td> </td><td>";
echo "<input type=\"submit\" name=\"save\" value=\"".get_string("uploadthisfile")."\" />";
echo "</td></tr>";

echo "</table>";
echo "</form>";
print_simple_box_end();

print_footer($course);
|
||
|
|
||
|
// START OF FUNCTIONS
|
||
|
|
||
|
/**
 * Unpacks the uploaded zip file and reads the raw html of every slide.
 *
 * The zip is moved to dataroot/temp/<modname>/ and unzipped there. The slides
 * are expected in a directory named like the zip file without its extension.
 * If that directory contains outline.htm, the slide file names (and their
 * order) are taken from its GoToSld('...') links; otherwise every file whose
 * name starts with "slide" is read and the result is sorted by path.
 *
 * @param array $file not used by the body; the upload is read from $_FILES['newfile']
 * @param int $courseid not used by the body
 * @param string $modname module name, used for the temp sub directory
 * @return array|false slide html keyed by the full slide path, or false when
 *                     nothing could be read
 */
function readdata($file, $courseid, $modname) {
    global $CFG;

    if (empty($_FILES['newfile']['name']) or empty($_FILES['newfile']['tmp_name'])) {
        return false;
    }

    // create an upload directory in temp
    make_upload_directory('temp/'.$modname);

    $base = $CFG->dataroot."/temp/$modname/";

    // basename(): the client supplied name must never carry a directory part
    $zipfile     = basename($_FILES["newfile"]["name"]);
    $tempzipfile = $_FILES["newfile"]["tmp_name"];

    // create our directory: the zip name with only its LAST extension removed.
    // pathinfo() sets no 'extension' key when the name contains no dot.
    $path_parts = pathinfo($zipfile);
    if (isset($path_parts['extension']) and $path_parts['extension'] !== '') {
        $dirname = substr($zipfile, 0, -(strlen($path_parts['extension']) + 1));
    } else {
        $dirname = $zipfile;
    }
    if (!file_exists($base.$dirname)) {
        mkdir($base.$dirname);
    }

    // move our uploaded file to temp/<modname>
    if (!move_uploaded_file($tempzipfile, $base.$zipfile)) {
        return false;
    }

    // unzip it!
    unzip_file($base.$zipfile, $base, false);

    $base = $base.$dirname; // update the base

    // this is the file where we get the names of the files for the slides (in the correct order too)
    $outline = $base.'/outline.htm';

    $pages = array();

    if (file_exists($outline) and is_readable($outline)) {
        $outlinecontents = file_get_contents($outline);
        $filenames = array();
        // [^']* instead of .* so that two links on one line are not merged into one match
        preg_match_all("/javascript:GoToSld\('([^']*)'\)/", $outlinecontents, $filenames);

        // fill $pages with the contents of all of the slides
        foreach ($filenames[1] as $slidefile) {
            $path = $base.'/'.$slidefile;
            if (!is_readable($path)) {
                return false;
            }
            $pages[$path] = file_get_contents($path);
        }
    } else {
        // cannot find the outline, so grab all files that start with slide
        if (!is_dir($base) or !($dh = opendir($base))) {
            return false;
        }
        while (false !== ($entry = readdir($dh))) {  // read through the directory
            if ('slide' == substr($entry, 0, 5)) {   // check for name (may want to check extension later)
                $path = $base.'/'.$entry;
                if (!is_readable($path)) {
                    closedir($dh);
                    return false;
                }
                $pages[$path] = file_get_contents($path);
            }
        }
        closedir($dh);

        ksort($pages);  // order them by file name
    }

    if (empty($pages)) {
        return false;
    }

    return $pages;
}
|
||
|
|
||
|
/**
 * Extracts title, text, bullet lists and images out of the raw slide html.
 *
 * Every slide is reduced to its <div> and <img> tags. Each non-nested, closed
 * tag is then classified by its class attribute: class T becomes the page
 * title, classes B and B1-B4 start a bullet list that build_list() rebuilds
 * as html, and anything else is appended as plain content. Images named
 * <slide>_image* are copied into a new, unique sub directory of
 * dataroot/<courseid>/moddata/<modname>/.
 *
 * The parsed tags are stored in the global $matches because build_list()
 * reads them from there.
 *
 * @param array $pages slide html keyed by slide path, as returned by readdata()
 * @param int $courseid course id, used to build the image directory and link
 * @param string $lessonname activity name, used to name the image sub directory
 * @param string $modname module name, used to build the image directory and link
 * @return array list of objects with the properties title (string),
 *               contents (array of strings), images (array of <img> tags)
 *               and source (slide file name)
 */
function extract_data($pages, $courseid, $lessonname, $modname) {
    global $CFG;
    global $matches;

    $extratedpages = array();

    // directory for images
    make_mod_upload_directory($courseid); // make sure moddata is made
    make_upload_directory($courseid.'/moddata/'.$modname, false); // we store our images in a subfolder in here

    $imagedir = $CFG->dataroot.'/'.$courseid.'/moddata/'.$modname;

    if ($CFG->slasharguments) {
        $imagelink = $CFG->wwwroot.'/file.php/'.$courseid.'/moddata/'.$modname;
    } else {
        $imagelink = $CFG->wwwroot.'/file.php?file=/'.$courseid.'/moddata/'.$modname;
    }

    // make a unique subfolder to store the images: <lessonname><first free number>
    $lessonname = str_replace(' ', '_', $lessonname); // get rid of spaces
    $suffix = 0;
    while (file_exists($imagedir.'/'.$lessonname.$suffix)) {
        $suffix++;
    }
    mkdir($imagedir.'/'.$lessonname.$suffix);
    $imagedir  = $imagedir.'/'.$lessonname.$suffix;
    $imagelink = $imagelink.'/'.$lessonname.$suffix;

    foreach ($pages as $slidepath => $content) {
        // to make life easier on our preg_match_alls, we strip out all tags except
        // for div and img (where our content is). We want div because sometimes we
        // can identify the content in the div based on the div's class
        $tags = '<div><img>'; // should also allow <b><i>
        $string = strip_tags($content, $tags);

        $matches = array();
        // this will look for a non nested tag that is closed
        // want to allow <b><i>(maybe more) tags but when we do that
        // the preg_match messes up.
        preg_match_all("/(<([\w]+)[^>]*>)([^<\\2>]*)(<\/\\2>)/", $string, $matches);

        $path_parts = pathinfo($slidepath);
        // slide name = basename up to its first dot (the whole basename when there is no dot)
        $dot = strpos($path_parts['basename'], '.');
        if ($dot === false) {
            $slidename = $path_parts['basename'];
        } else {
            $slidename = substr($path_parts['basename'], 0, $dot);
        }

        $imgs = array();
        // this preg matches all images; the slide name is quoted so that regex
        // meta characters in a file name cannot alter or break the pattern
        preg_match_all("/<img[^>]*(src\=\"(".preg_quote($slidename, '/')."\_image[^>^\"]*)\"[^>]*)>/i", $string, $imgs);

        // start building our page
        $page = new stdClass;
        $page->title = '';
        $page->contents = array();
        $page->images = array();
        $page->source = $path_parts['basename']; // need for book only

        // $imgs[1] holds the complete attribute string of each image (style
        // included) and $imgs[2] only the file name. Only the file name is used;
        // prep_page() still carries an "imgstyle" replacement for the other variant.
        foreach ($imgs[2] as $img) {
            if ($img !== basename($img)) {
                // the src comes from the uploaded html: only accept a plain
                // file name sitting next to the slide, never a path
                continue;
            }
            if (!copy($path_parts['dirname'].'/'.$img, $imagedir.'/'.$img)) {
                continue; // do not link to an image that was not copied
            }
            $page->images[] = "<img src=\"$imagelink/$img\" title=\"$img\" />";
        }

        // go through all of our tag matches. build_list() advances $i itself and
        // leaves it ON the first element that is not part of the list, so $i must
        // not be incremented again afterwards (the previous for loop did, which
        // dropped the element following every bullet list).
        $total = count($matches[1]);
        $i = 0;
        while ($i < $total) {

            $class = isolate_class($matches[1][$i]); // first step in isolating the class

            // check for any static classes
            switch ($class) {
                case 'T':   // class T is used for Titles
                    $page->title = $matches[3][$i];
                    $i++;
                    break;
                case 'B':   // I would guess that all bullet lists would start with B then go to B1, B2, etc
                case 'B1':  // B1-B4 are just insurance, should just hit B and all be taken care of
                case 'B2':
                case 'B3':
                case 'B4':
                    $start = $i;
                    $page->contents[] = build_list('<ul>', $i, 0); // this is a recursive function that will grab all the bullets and rebuild the list in html
                    if ($i == $start) {
                        $i++; // safety net: never loop forever if nothing was consumed
                    }
                    break;
                default:
                    $text = $matches[3][$i];
                    // skip the blank filler elements the export generates.
                    // NOTE(review): '&#13;' is accepted as well because the ' '
                    // literal looks like an entity that was decoded on the way - confirm
                    if ($text != ' ' and $text != '&#13;') {
                        if (substr($text, 0, 1) == ':') { // check for a leading ':' and get rid of it
                            $page->contents[] = substr($text, 1);
                        } else {
                            $page->contents[] = $text;
                        }
                    }
                    $i++;
                    break;
            }
        }

        // add the page to the array;
        $extratedpages[] = $page;

    } // end $pages foreach loop

    return $extratedpages;
}
|
||
|
|
||
|
/**
 * A recursive function to build a html list out of consecutive bullet elements.
 *
 * Reads the parsed slide tags from the global $matches (filled by
 * extract_data()) starting at index $i. Class B is depth 0 and class B<n> is
 * depth n. A deeper element opens a nested <ul> through recursion, a shallower
 * element ends the current level, and the first element whose class does not
 * contain 'B' ends the whole list.
 *
 * @param string $list the html built so far (the caller passes the opening '<ul>')
 * @param int $i index into $matches, passed by reference; on return it
 *               points at the first element that was not consumed
 * @param int $depth nesting depth of the list being built
 * @return string $list with the items and the closing '</ul>' appended
 */
function build_list($list, &$i, $depth) {
    global $matches; // shared with extract_data(), which parses the current slide into it

    $total = count($matches[1]);

    while ($i < $total) {

        $class = isolate_class($matches[1][$i]);

        if (!strstr($class, 'B')) {
            // not a B class, so get out of here...
            break;
        }

        // make sure we are still working with bullet classes
        if ($class == 'B') {
            $this_depth = 0;  // calling class B depth 0
        } else {
            // set the depth number.  So B1 is depth 1 and B2 is depth 2 and so on
            $this_depth = substr($class, 1);
            if (!is_numeric($this_depth)) {
                error("Depth not parsed!");
            }
        }

        if ($this_depth < $depth) {
            // we are moving back a level in the nesting
            break;
        }

        if ($this_depth > $depth) {
            // we are moving in a lvl in nesting
            $list .= '<ul>';
            $list = build_list($list, $i, $this_depth);
            // once we return back, should go to the start of the while
            continue;
        }

        // no depth changes, so add the match to our list. The text is cleaned
        // once and compared explicitly, so that a bullet reading "0" is kept
        // (a plain truthiness test would drop it).
        $cleanstring = ppt_clean_text($matches[3][$i]);
        if ($cleanstring !== false and $cleanstring !== '') {
            $list .= '<li>'.$cleanstring.'</li>';
        }
        $i++;
    }

    // end the list and return it
    $list .= '</ul>';
    return $list;
}
|
||
|
|
||
|
/**
 * Given an html tag, this function will return the value of its class attribute.
 *
 * The exported slides write the class without quotes (<div class=T ...>).
 * The value ends at the first whitespace character (space, tab or line break)
 * or at the closing '>'. Optional single or double quotes around the value are
 * not part of the result.
 *
 * @param string $string an opening html tag, e.g. '<div class=B1 style="...">'
 * @return string the class name, or '' when the tag has no class attribute
 */
function isolate_class($string) {
    $found = array();
    // (?<![\w-]) keeps attributes such as "subclass=" or "data-class=" from matching
    if (preg_match('/(?<![\w-])class\s*=\s*["\']?([^\s"\'>]*)/i', $string, $found)) {
        return $found[1];
    }

    // no class defined in the tag
    return '';
}
|
||
|
|
||
|
/**
 * This function strips off the random chars that ppt puts in front of bullet lists.
 *
 * By default one leading character (the bullet glyph) is removed. When the
 * text starts with the 4 character entity '&lt;' the whole entity is removed.
 *
 * NOTE(review): the entity literals below were restored. The text handed in by
 * build_list() comes from a regex capture that excludes '<', so a literal '<'
 * could never match, and 4 is exactly the length of '&lt;'. Please confirm
 * against the upstream file.
 *
 * @param string $string raw text of one bullet element
 * @return string|false the cleaned text, or false when nothing but a blank
 *                      (empty string, single space or '&#13;') is left
 */
function ppt_clean_text($string) {
    $chop = 1; // default: just a single char in front of the content

    // look for any other crazy things that may be in front of the content
    if (strpos($string, '&lt;') === 0) {  // the entity has to be at the very front
        $chop = 4;  // drop the complete entity
    }
    // may need to add more later....

    $string = substr($string, $chop);

    // substr() gives false (PHP < 8) or '' (PHP 8+) when nothing is left
    if ($string === false or $string === '' or $string === ' ' or $string === '&#13;') {
        return false;
    }

    return $string;
}
|
||
|
|
||
|
/**
 * Placeholder for cleaning up the temp directory after an import.
 *
 * Currently does nothing: the only cleanup call is commented out. When it is
 * implemented it should remove only what this import created, because another
 * user could be importing a presentation at the same time.
 *
 * @return void
 */
function clean_temp() {
    global $CFG;

    // Known to be broken, kept as a reminder for a later cleanup:
    //delDirContents($CFG->dataroot.'/temp/lesson');
}
|
||
|
|
||
|
|
||
|
/**
 * Creates the chapter objects that are to be inserted into the database.
 *
 * One chapter is built per imported page. Page numbers continue after the
 * chapters the book already has (count of book_chapters records + 1).
 *
 * Every chapter is a separate object. Re-using one object for all pages does
 * not work on PHP 5 and later, where objects are handled by identifier: every
 * array entry would point to the same object and end up with the data of the
 * last page.
 *
 * @param array $pageobjects page objects as returned by extract_data()
 * @param int $bookid id of the book the chapters belong to
 * @return array list of chapter objects, in page order
 */
function book_create_objects($pageobjects, $bookid) {

    $chapters = array();

    // first free page number and a single timestamp for the whole import
    $pagenum = count_records('book_chapters', 'bookid', $bookid) + 1;
    $now = time();

    $i = 1;
    foreach ($pageobjects as $pageobject) {
        $page = prep_page($pageobject, $i);  // get title and contents

        $chapter = new stdClass;
        $chapter->bookid = $bookid;
        $chapter->pagenum = $pagenum;
        $chapter->timecreated = $now;
        $chapter->timemodified = $now;
        $chapter->subchapter = 0;
        $chapter->importsrc = addslashes($pageobject->source); // add the source
        $chapter->title = $page->title;
        $chapter->content = $page->contents;
        $chapters[] = $chapter;

        // increment our page number and our counter
        $pagenum++;
        $i++;
    }

    return $chapters;
}
|
||
|
|
||
|
/**
 * Builds the title and content strings from a page object.
 *
 * The title falls back to "Page <count>" when the slide has none. The content
 * is the concatenation of all image tags followed by every text element
 * wrapped in <p> tags. Line breaks are removed and every piece is escaped
 * with addslashes().
 *
 * @param object $pageobject page object with the properties title (string),
 *                           images (array of strings) and contents (array of strings)
 * @param int $count 1-based page counter, used for the generic title
 * @return object object with the properties title and contents (both strings)
 */
function prep_page($pageobject, $count) {
    // must be created explicitly: assigning a property to an undefined
    // variable is a fatal error on PHP 8
    $page = new stdClass;

    if ($pageobject->title == '') {
        $page->title = "Page $count";  // no title set so make a generic one
    } else {
        $page->title = addslashes($pageobject->title);
    }

    $page->contents = '';

    // nab all the images first
    foreach ($pageobject->images as $image) {
        $image = str_replace(array("\n", "\r"), '', $image);
        $image = str_replace("'", '"', $image);  // imgstyle

        $page->contents .= addslashes($image);
    }

    // go through the contents array, strip the line breaks (found to be
    // unnecessary) and put <p> tags around each element
    foreach ($pageobject->contents as $content) {
        // NOTE(review): the third needle was a single space, which removed every
        // space from the slide text. Going by the original "puts in returns?"
        // remark it is restored to the carriage return entity - please confirm.
        $content = str_replace(array("\n", "\r", '&#13;'), '', $content);
        $content = '<p>'.$content.'</p>';
        $page->contents .= addslashes($content);
    }

    return $page;
}
|
||
|
|
||
|
/**
 * Saves the chapter objects to the database.
 *
 * Each chapter is inserted into book_chapters in the given order and the
 * value returned by insert_record() is stored as the chapter's id. A failed
 * insert is reported through error().
 *
 * @param array $chapters chapter objects as built by book_create_objects()
 * @param int $bookid not used by the body
 * @param int $pageid not used by the body
 * @return bool always true
 */
function book_save_objects($chapters, $bookid, $pageid='0') {
    // nothing fancy, just save them all in order
    foreach ($chapters as $record) {
        $record->id = insert_record('book_chapters', $record);
        if (!$record->id) {
            error('Could not update your book');
        }
    }

    return true;
}
|
||
|
|
||
|
?>
|