python 把 word 转 html(以下示例代码是用 PHP 通过 COM 调用 Word 实现的):上传页面
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=gb2312" />
<title>文件上传</title>
</head>
<body>
<form action="receivefile.php" method="post" enctype="multipart/form-data">
<input type="file" name="filename" />
<input type="submit" />
</form>
</body>
</html>
接收页面(receivefile.php,即上传表单 action 指向的页面)
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=gb2312" />
<title>接收上传文件</title>
<?php
// Receives the file posted by the upload form, stores it under uploads/ and
// hands its absolute path to word2html() for conversion.
//
// Every failure stops the request with die(), matching the error style used
// by word2html(), so the completion message further down is never printed
// after a failed step.

// Open the Access database that sits beside this script. Nothing in this
// section uses $conn afterwards; it is kept in case other code relies on the
// connection -- TODO confirm and remove if it is really unused.
$conn = @new COM("ADODB.Connection");
$connstr = "DRIVER={Microsoft Access Driver (*.mdb)}; DBQ=" . realpath("person.mdb");
$conn->Open($connstr);

$uploaddir = 'uploads/';
if (!is_dir($uploaddir) && !mkdir($uploaddir)) {
    die("无法创建上传目录");
}

// Refuse requests that carry no file or whose upload failed, instead of
// continuing with undefined array entries.
if (!isset($_FILES['filename']) || $_FILES['filename']['error'] !== UPLOAD_ERR_OK) {
    die("文件上传失败");
}

// The client-supplied name is untrusted: drop any directory component and
// accept only Word documents, so that scripts or other arbitrary files cannot
// be planted in this web-served directory.
$clientname = basename($_FILES['filename']['name']);
// Split at the LAST dot so names such as "a.b.doc" keep their full base name.
$dotpos = strrpos($clientname, '.');
$extension = ($dotpos === false) ? '' : strtolower(substr($clientname, $dotpos + 1));
if ($dotpos === false || $dotpos === 0 || !in_array($extension, array('doc', 'docx'), true)) {
    die("只允许上传 .doc 或 .docx 文件");
}

// Values below are echoed for diagnostics. They derive from user input, so
// they are HTML-escaped using the charset declared in the page's meta tag.
$filename = substr($clientname, 0, $dotpos);
echo htmlspecialchars($filename, ENT_QUOTES, 'GB2312');
echo "<br>";

$uploadfile = $uploaddir . $clientname; // directory + base name + extension
echo htmlspecialchars($uploadfile, ENT_QUOTES, 'GB2312');
echo "<br>";

$temploadfile = $_FILES['filename']['tmp_name'];
echo htmlspecialchars($temploadfile, ENT_QUOTES, 'GB2312');
echo "<br>";

// Move the upload out of PHP's temporary directory; stop if that fails so
// Word is never pointed at a file that does not exist.
if (!move_uploaded_file($temploadfile, $uploadfile)) {
    die("无法保存上传的文件");
}

// Word needs an absolute path. Resolve it from the stored file itself rather
// than rebuilding it from SCRIPT_FILENAME / PHP_SELF and a hard-coded
// application folder name.
$htmlpath = realpath($uploadfile);
if ($htmlpath === false) {
    die("无法保存上传的文件");
}
echo htmlspecialchars($htmlpath, ENT_QUOTES, 'GB2312');
echo "<br>";

word2html($htmlpath);
// TODO: record the upload (name and stored path) in the database, using a
// parameterized query rather than string interpolation.
?>
<?php
//http://tieba.baidu.com/f?kz=13975389
/**
 * Converts a Word document to HTML by automating MS Word through COM.
 *
 * The HTML is saved next to the source document under the same base name;
 * the path passed to SaveAs carries no extension.
 *
 * Stops the script with die() when Word cannot be started or the document
 * cannot be opened. A failure while saving is re-thrown after Word has been
 * shut down.
 *
 * @param string $wfilepath Absolute path of the Word document to convert.
 */
function word2html($wfilepath)
{
    // COM failures are reported as exceptions, so an "or die" attached to the
    // expression never fires; catch them to show the intended messages.
    try {
        $word = new COM("Word.Application");
    } catch (Exception $e) {
        die("无法打开 MS Word");
    }

    // Keep Word hidden and silent: nobody is at the server console to look at
    // a window or dismiss a modal dialog, which would hang the request.
    $word->Visible = 0;
    $word->DisplayAlerts = 0; // wdAlertsNone

    try {
        $word->Documents->Open($wfilepath);
    } catch (Exception $e) {
        $word->Quit(0); // do not leave a stray Word process behind
        die("无法打开这个文件");
    }

    // Strip the extension at the last dot of the file name, whatever its
    // length (".doc" and ".docx" alike). A dot inside a directory name is
    // ignored.
    $htmlpath = $wfilepath;
    $dotpos = strrpos($wfilepath, '.');
    $seppos = (int) strrpos(strtr($wfilepath, '\\', '/'), '/');
    if ($dotpos !== false && $dotpos > $seppos) {
        $htmlpath = substr($wfilepath, 0, $dotpos);
    }

    try {
        $word->ActiveDocument->SaveAs($htmlpath, 8); // 8 = wdFormatHTML
    } catch (Exception $e) {
        $word->Quit(0);
        throw $e;
    }

    $word->Quit(0); // 0 = wdDoNotSaveChanges
}
// Tell the user that the conversion step has finished.
echo 'Word转html完成!';
?>
</head>
<body>
</body>
</html>
SaveAs 的第二个参数(数字)代表要转换成的文件格式,取值来自 WdSaveFormat 枚举(例如上面代码中的 8 即 wdFormatHTML),参考:http://msdn.microsoft.com/zh-cn/library/microsoft.office.interop.word.wdsaveformat.aspx
http://jingyan.baidu.com/article/a3761b2b8ed03c1577f9aa60.html
http://msdn.microsoft.com/zh-cn/library/ff194352(v=office.15).aspx
http://stackoverflow.com/questions/10366596/reading-table-contetnts-in-ms-word-file-using-python
http://msdn.microsoft.com/zh-cn/library/ff837519.aspx
http://www.cnblogs.com/oracleblogs/p/3387436.html
http://my.oschina.net/kakablue/blog/170361
http://www.cnblogs.com/rongyilin/archive/2012/12/21/2828007.html
html5:
http://www.starming.com/index.php?action=plugin&v=wave&tpl=union&ac=viewgrouppost&gid=34464&tid=17975