python word操作深入

用 PHP(通过 COM 调用 Word)把 Word 文档转成 HTML。上传页面:
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=gb2312" />
<title>文件上传</title>
</head>

<body>
    <!-- Upload form: POSTs the selected file to receivefile.php as
         multipart/form-data; the file is sent under the field name "filename". -->
    <form action="receivefile.php" method="post" enctype="multipart/form-data">
    <input type="file" name="filename" />
    <input type="submit" />
    </form>
</body>
</html>

接收页面

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=gb2312" />
<title>接收上传文件</title>

<?php
    // Handles the file posted by the upload form: validates the upload,
    // stores it under uploads/ and passes the stored file's absolute path to
    // word2html() (declared further down in this file) for conversion.
    //
    // TODO: if uploads should be recorded in a database, add that here using
    // a parameterised query rather than interpolating the file name into SQL.

$uploaddir = 'uploads/';
if (!is_dir($uploaddir) && !mkdir($uploaddir)) {
    exit('无法创建上传目录');
}

// Stop early when no file was posted or PHP reports the upload as failed
// (too large, partial, no temp dir, ...), instead of converting nothing.
if (!isset($_FILES['filename']) || $_FILES['filename']['error'] !== UPLOAD_ERR_OK) {
    exit('文件上传失败');
}

// The client-supplied name is untrusted: keep only its last path component.
$clientname = basename($_FILES['filename']['name']);

// Split at the LAST dot so that "a.b.doc" yields base "a.b" and extension "doc".
$dotpos = strrpos($clientname, '.');
$filename = ($dotpos === false) ? $clientname : substr($clientname, 0, $dotpos);
$extension = ($dotpos === false) ? '' : strtolower(substr($clientname, $dotpos + 1));

// Only Word documents are accepted. The file is stored below the web root and
// opened by Word, so arbitrary types (e.g. .php scripts) must be refused.
$allowed = array('doc', 'docx', 'rtf');
if ($filename === '' || !in_array($extension, $allowed, true)) {
    exit('只允许上传 Word 文档 (.doc / .docx / .rtf)');
}

$uploadfile = $uploaddir . $clientname; // directory + base name + extension
$temploadfile = $_FILES['filename']['tmp_name'];

if (!move_uploaded_file($temploadfile, $uploadfile)) {
    exit('无法保存上传的文件');
}

// Word needs an absolute path. Resolve the file that was just stored instead
// of rebuilding the path from SCRIPT_FILENAME/PHP_SELF and a hard-coded
// directory name, which only worked for one particular deployment.
$htmlpath = realpath($uploadfile);
if ($htmlpath === false) {
    exit('无法保存上传的文件');
}

// Debug output. Values derive from client input, so escape them; the charset
// matches the page's declared gb2312 encoding.
foreach (array($filename, $uploadfile, $temploadfile, $htmlpath) as $value) {
    echo htmlspecialchars($value, ENT_QUOTES, 'GB2312');
    echo "<br>";
}

word2html($htmlpath);

?>
<?php
//http://tieba.baidu.com/f?kz=13975389

  /**
   * Converts a Word document to HTML by automating MS Word through COM.
   *
   * The output is written next to the source file, using the source path
   * with its extension removed; Word picks the extension for the HTML format.
   * Terminates the script with a message when Word cannot be started or the
   * document cannot be opened. A failure while saving is rethrown after Word
   * has been shut down.
   *
   * @param string $wfilepath Absolute path of the Word document to convert.
   * @return void
   */
  function word2html($wfilepath)
  {
      // COM construction failures are reported by exception, not by a false
      // return value, so they have to be caught to show the message.
      try {
          $word = new COM("Word.Application");
      } catch (Exception $e) {
          die("无法打开 MS Word");
      }

      // Keep Word hidden: this runs on the server, nobody is there to see it.
      $word->Visible = 0;

      // Strip only the real extension (whatever its length) from the file
      // name part, so ".docx" is handled as well as ".doc".
      $dotpos = strrpos($wfilepath, '.');
      $seppos = max((int) strrpos($wfilepath, '/'), (int) strrpos($wfilepath, '\\'));
      $htmlpath = ($dotpos !== false && $dotpos > $seppos)
          ? substr($wfilepath, 0, $dotpos)
          : $wfilepath;

      $opened = false;
      try {
          $word->Documents->Open($wfilepath);
          $opened = true;
          $word->ActiveDocument->SaveAs($htmlpath, 8); // 8 = wdFormatHTML
      } catch (Exception $e) {
          // Always shut Word down, otherwise a WINWORD process is left behind.
          $word->Quit(0); // 0 = wdDoNotSaveChanges
          if (!$opened) {
              die("无法打开这个文件");
          }
          throw $e;
      }

      $word->Quit(0); // 0 = wdDoNotSaveChanges
  }
 print( "Word转html完成!" );
?>
</head>

<body>
</body>
</html>

SaveAs 的第二个参数(数字)代表要保存成的格式,例如 8 表示 wdFormatHTML(HTML 格式)。完整的取值列表参考:http://msdn.microsoft.com/zh-cn/library/microsoft.office.interop.word.wdsaveformat.aspx

http://jingyan.baidu.com/article/a3761b2b8ed03c1577f9aa60.html

http://msdn.microsoft.com/zh-cn/library/ff194352(v=office.15).aspx

http://stackoverflow.com/questions/10366596/reading-table-contetnts-in-ms-word-file-using-python

http://msdn.microsoft.com/zh-cn/library/ff837519.aspx

http://www.cnblogs.com/oracleblogs/p/3387436.html

http://my.oschina.net/kakablue/blog/170361

http://www.cnblogs.com/rongyilin/archive/2012/12/21/2828007.html

html5:

http://www.starming.com/index.php?action=plugin&v=wave&tpl=union&ac=viewgrouppost&gid=34464&tid=17975

原文地址:https://www.cnblogs.com/youxin/p/3570432.html