首页 > 语言 > PHP > 正文

php解析mht文件转换成html的实例

2024-05-04 23:55:48
字体:
来源:转载
供稿:网友

php解析mht文件,使用编辑器打开可以看到base64编码所以,mht是可以转换成html的。

<?php/** * 针对Mht格式的文件进行解析* 使用例子:* * function mhtmlParseBody($filename) {	if (file_exists ( $filename )) {		if (is_dir ( $filename )) return false;				$filename = strtolower ( $filename );		if (strpos ( $filename, '.mht', 1 ) == FALSE) return false;							$o_mhtml = new mhtml ();		$o_mhtml->set_file ( $filename );		$o_mhtml->extract ();		return $o_mhtml->get_part_to_file(0);	}	return null;}function mhtmlParseAll($filename) {	if (file_exists ( $filename )) {		if (is_dir ( $filename )) return false;		$filename = strtolower ( $filename );		if (strpos ( $filename, '.mht', 1 ) == FALSE) return false;					$o_mhtml = new mhtml ();		$o_mhtml->set_file ( $filename );		$o_mhtml->extract ();		return $o_mhtml->get_all_part_file();	}	return null;}*/class mhtparse {	var $file = '';	var $boundary = '';	var $filedata = '';	var $countparts = 1;	var $log = '';		function extract() {		$this->read_filedata ();		$this->file_parts ();		return 1;	}		function set_file($p) {		$this->file = $p;	}		function get_log() {		return $this->log;	}		function file_parts() {		$lines = explode ( "/n", substr ( $this->filedata, 0, 8192 ) );		foreach ( $lines as $line ) {			$line = trim ( $line );			if (strpos ( $line, '=' ) !== FALSE) {				if (strpos ( $line, 'boundary', 0 ) !== FALSE) {					$range = $this->getrange ( $line, '"', '"', 0 );					$this->boundary = "--" . $range ['range'];					$this->filedata = str_replace ( $line, '', $this->filedata );					break;				}			}		}		if ($this->boundary != '') {			$this->filedata = explode ( $this->boundary, $this->filedata );			unset ( $this->filedata [0] );			$this->filedata = array_values ( $this->filedata );			$this->countparts = count ( $this->filedata );		} else {			$tmp = $this->filedata;			$this->filedata = array (					$tmp 			);		}	}		function get_all_part_file() {		return $this->filedata;	}		function get_part_to_file($i) {		$line_data_start = 0;		$encoding = '';		$part_lines = explode ( "/n", ltrim ( $this->filedata [$i] ) );		foreach ( $part_lines as $line_id => $line ) {			$line = trim ( $line );			if ($line == '') {				if (trim ( $part_lines [0] ) == '--')					return 1;				$line_data_start = $line_id;				break;			}			if (strpos ( $line, ':' ) !== FALSE) {				$pos = strpos ( $line, ':' );				$k = strtolower ( trim ( substr ( $line, 0, $pos ) ) );				$v = trim ( substr ( $line, $pos + 1, strlen ( $line ) ) );				if ($k == 'content-transfer-encoding') {					$encoding = $v;				}				if ($k == 'content-location') {					$location = $v;				}				if ($k == 'content-type') {					$contenttype = $v;				}			}		}				foreach ( $part_lines as $line_id => $line ) {			if ($line_id <= $line_data_start)				$part_lines [$line_id] = '';		}				$part_lines = implode ( '', $part_lines );		if ($encoding == 'base64')			$part_lines = base64_decode ( $part_lines );		elseif ($encoding == 'quoted-printable')			$part_lines = imap_qprint ( $part_lines );				return $part_lines;	}		function read_filedata() {		$handle = fopen ( $this->file, 'r' );		$this->filedata = fread ( $handle, filesize ( $this->file ) );		fclose ( $handle );	}		function getrange(&$subject, $Beginmark_str = '{', $Endmark_str = '}', $Start_pos = 0) {		/*		 * $str="sssss { x { xx } {xx{xx } x} x} sssss"; $range=string::getRange($str,'{','}',0); echo $range['range']; //tulem: " x { xx } {xx{xx } x} x" echo $range['behin']; //tulem: 6 echo $range['end']; //tulem: 30 (' ') -- l5pumärgist järgnev out: array('range'=>$Range,'begin'=>$Begin_firstOccurence_pos,'end'=>$End_sequel_pos) | false v1.1 2004-2006,Uku-Kaarel J5esaar,ukjoesaar@hot.ee,http://www.hot.ee/ukjoesaar,+3725110693		 */		if (empty ( $Beginmark_str ))			$Beginmark_str = '{';		$Beginmark_str_len = strlen ( $Beginmark_str );				if (empty ( $Endmark_str ))			$Endmark_str = '}';		$Endmark_str_len = strlen ( $Endmark_str );				/* $Start_pos_cache = 0; */		do {			/* !algus */			if (! is_int ( $Begin_firstOccurence_pos ))				$Start_pos_cache = $Start_pos;								/* ?algus-test */			$Start_pos_cache = @strpos ( $subject, $Beginmark_str, $Start_pos_cache );						/* this is possible start for range */			if (is_int ( $Start_pos_cache )) {				/* skip */				$Start_pos_cache = ($Start_pos_cache + $Beginmark_str_len);				/* test possible range start pos */				if (is_int ( $Begin_firstOccurence_pos )) {					if ($Start_pos_cache < $range_end_pos)						$rangeClean = 0;					elseif ($Start_pos_cache > $range_end_pos)						$rangeClean = 1;				}				/* here it is */				if (! is_int ( $Begin_firstOccurence_pos ))					$Begin_firstOccurence_pos = $Start_pos_cache;			} /* VIGA NR 0 ALGUST EI OLE */						if (! is_int ( $Start_pos_cache )) {				/* !algus */	/* VIGA NR 1 ALGUSMARKI EI LEITUD : VIIMANE VOIMALIK ALGUS */	if (is_int ( $Begin_firstOccurence_pos ) and ($Start_pos_cache < $range_end_pos))					$rangeClean = 1;				else					return false;			}			if (is_int ( $Begin_firstOccurence_pos ) and ($rangeClean != 1)) {				if (! is_int ( $End_pos_cache ))					$End_sequel_pos = $Begin_firstOccurence_pos;								$End_pos_cache = strpos ( $subject, $Endmark_str, $End_sequel_pos );								/* ok */				if (is_int ( $End_pos_cache ) and ($rangeClean != 1)) {					$range_current_lenght = ($End_pos_cache - $Begin_firstOccurence_pos);					$End_sequel_pos = ($End_pos_cache + $Endmark_str_len);					$range_end_pos = $End_pos_cache;				}				/* VIGA NR 2 LOPPU EI LEITUD */				if (! is_int ( $End_pos_cache ))					if ($End_pos_cache == false)						return false;			}		} while ( $rangeClean < 1 );				if (is_int ( $Begin_firstOccurence_pos ) and is_int ( $range_current_lenght ))			$Range = substr ( $subject, $Begin_firstOccurence_pos, $range_current_lenght );		else			return false;				return array (				'range' => $Range,				'begin' => $Begin_firstOccurence_pos,				'end' => $End_sequel_pos 		);	} // end getrange()} // class?>

以上这篇php解析mht文件转换成html的实例就是小编分享给大家的全部内容了,希望能给大家一个参考,也希望大家多多支持VeVb武林网。


注:相关教程知识阅读请移步到PHP教程频道。
发表评论 共有条评论
用户名: 密码:
验证码: 匿名发表

图片精选