File: ForumMLInsert.class.php

package info (click to toggle)
fusionforge 5.3.2%2B20141104-3
  • links: PTS, VCS
  • area: main
  • in suites: jessie-kfreebsd
  • size: 60,472 kB
  • sloc: php: 271,846; sql: 36,817; python: 14,575; perl: 6,406; sh: 5,980; xml: 4,294; pascal: 1,411; makefile: 911; cpp: 52; awk: 27
file content (330 lines) | stat: -rw-r--r-- 12,434 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
<?php
#
# Copyright (c) STMicroelectronics, 2005. All Rights Reserved.

 # Originally written by Jean-Philippe Giola, 2005
 #
 # This file is a part of codendi.
 #
 # codendi is free software; you can redistribute it and/or modify
 # it under the terms of the GNU General Public License as published by
 # the Free Software Foundation; either version 2 of the License, or
 # (at your option) any later version.
 #
 # codendi is distributed in the hope that it will be useful,
 # but WITHOUT ANY WARRANTY; without even the implied warranty of
 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 # GNU General Public License for more details.
 #
 # You should have received a copy of the GNU General Public License along
 # with this program; if not, write to the Free Software Foundation, Inc.,
 # 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 #
 # $Id$
 #
require_once 'ForumML_MessageDao.class.php';

/**
 * ForumML database insertion helper.
 *
 * Stores a parsed mail for one mailing list through a ForumML_MessageDao:
 * the message row itself, its headers and its attachments.
 */
class ForumMLInsert {
    /** Id returned by the DAO for the message most recently inserted by insertMessage(). */
    public $id_message;
    /** Header structure most recently passed to insertMessage(). */
    public $mail;
    /** Id of the mailing list the stored messages belong to. */
    public $id_list;
    /** ForumML_MessageDao instance used for every database access. */
    public $dao;

    /**
     * Class constructor.
     *
     * @param Integer $list_id Id of the mailing list messages will be attached to
     */
    function __construct($list_id) {
        $this->id_list = $list_id;
        $this->dao = new ForumML_MessageDao(CodendiDataAccess::instance());
    }

    /**
     * Insert a header value of the current message (forumml_messageheader table).
     *
     * The message used is $this->id_message, i.e. the one set by the last
     * call to insertMessage().
     *
     * @param Integer $id_header Id of the header name
     * @param String  $value     Header value
     */
    function insertMessageHeader($id_header,$value) {
        $this->dao->insertMessageHeader($this->id_message, $id_header, $value);
    }

    /**
     * Insert an attachment record (forumml_attachment table).
     *
     * The stored size is read from the file system; it is 0 when $filepath
     * is not a regular file.
     *
     * @param Integer $id_message Message the attachment belongs to
     * @param String  $filename   Attachment file name
     * @param String  $filetype   Content type of the attachment
     * @param String  $filepath   Path of the stored file
     * @param String  $content_id Content-ID header of the part, if any
     */
    function insertAttachment($id_message, $filename,$filetype,$filepath,$content_id="") {
        $filesize = is_file($filepath) ? filesize($filepath) : 0;
        $this->dao->insertAttachment($id_message, $filename, $filetype, $filesize, $filepath, $content_id);
    }

    /**
     * Get the id of a header name, creating it in forumml_header if needed.
     *
     * @param String $header Header name
     *
     * @return mixed The 'id_header' of the existing row, or whatever the DAO
     *               returns from insertHeader() when the header was created
     */
    function insertHeader($header) {
        // Search if the header is already in the table
        $result = $this->dao->searchHeader($header);
        if ($result->rowCount() < 1) {
            // If not, insert it
            return $this->dao->insertHeader($header);
        }
        $row = $result->getRow();
        return $row['id_header'];
    }

    /**
     * Find the message whose message-id header matches the given value.
     *
     * @param String $messageIdHeader Message-id to look for
     *
     * @return mixed The 'id_message' of the first matching row, false if none
     */
    function getParentMessageFromHeader($messageIdHeader) {
        $result = $this->dao->getParentMessageFromHeader($messageIdHeader);
        if ($result && $result->rowCount() >= 1) {
            $row = $result->getRow();
            return $row['id_message'];
        }
        return false;
    }

    /**
     * Propagate a new "last thread update" date up the chain of parents.
     *
     * Starting at $messageId, each message whose 'last_thread_update' is older
     * than $date is updated, then its 'id_parent' is processed in turn. The
     * walk stops at the first message that is already up to date, that cannot
     * be loaded, or whose parent id is 0.
     *
     * @param Integer $messageId Message to start from
     * @param Integer $date      Timestamp of the newly received message
     */
    function updateParentDate($messageId, $date) {
        while ($messageId != 0) {
            $dar = $this->dao->getParents($messageId);
            if (!$dar) {
                return;
            }
            $row = $dar->getRow();
            // No row means there is nothing to update: do not index a non-array.
            if (!$row || !($date > $row['last_thread_update'])) {
                return;
            }
            $this->dao->updateParentDate($messageId, $date);
            $messageId = $row['id_parent'];
        }
    }

    /**
     * Return the last whitespace separated token of a header value.
     *
     * Any run of whitespace (spaces, tabs, folded lines) is a separator, and
     * leading/trailing whitespace is ignored.
     *
     * @param String $value Raw header value
     *
     * @return String The last token, "" when the value holds no token
     */
    private function getLastToken($value) {
        $tokens = preg_split('/\s+/', trim($value), -1, PREG_SPLIT_NO_EMPTY);
        if (!$tokens) {
            return "";
        }
        return $tokens[count($tokens) - 1];
    }

    /**
     * Insert a message (forumml_message table) together with its headers.
     *
     * The parent message is looked up from the 'in-reply-to' header or, when
     * that header is absent, from the last id listed in 'references'.
     *
     * @param Array  $structure Headers of the mail, indexed by header name
     * @param String $body      Body of the message
     * @param String $ctype     Content type of the body
     *
     * @return mixed Id of the inserted message, as returned by the DAO
     */
    function insertMessage($structure,$body,$ctype="") {

        $this->mail = $structure;

        if (isset($structure["in-reply-to"])) {
            $reply_to = $structure["in-reply-to"];
            // special case: 'in-reply-to' header may contain "Message from ... ",
            // the message id is then the last word of the header
            if (preg_match('/^Message from.*$/', $reply_to)) {
                $reply_to = $this->getLastToken($reply_to);
            }
        } elseif (isset($structure["references"])) {
            // special case: 'in-reply-to' header is not set, but 'references' - which
            // contains the list of parent message ids - is set: the direct parent is
            // the last id of the list
            $reply_to = $this->getLastToken($structure["references"]);
        } else {
            $reply_to = "";
        }

        // Message date
        // Cannot rely on server's date because it might be different
        // and it doesn't work when it comes to load mail archives!
        $messageDate = isset($structure['date']) ? strtotime($structure['date']) : false;

        $id_parent = 0;
        // If the current message is an answer
        if ($reply_to != "") {
            $found = $this->getParentMessageFromHeader($reply_to);
            // Unknown parent (lookup returned false): keep 0, the "no parent" value
            if ($found) {
                $id_parent = $found;
            }
        }

        if ($id_parent != 0) {
            $this->updateParentDate($id_parent, $messageDate);
        }
        $this->id_message = $this->dao->insertMessage($this->id_list, $id_parent, $body, $messageDate, $ctype);

        // All headers of the current mail are stored in the forumml_messageheader
        // table, except the first entry of the structure and the "received" header
        $isFirst = true;
        foreach ($structure as $header => $value_header) {
            if ($isFirst) {
                $isFirst = false;
                continue;
            }
            if ($header != "received") {
                $id_header = $this->insertHeader($header);
                if (is_array($value_header)) {
                    $value_header = implode(",", $value_header);
                }
                $this->insertMessageHeader($id_header, $value_header);
            }
        }

        return $this->id_message;
    }

    /**
     * Encode string in UTF8 if source charset given or if detected
     *
     * @param String $string  Text to convert
     * @param String $charset Source charset; detected with mb_detect_encoding() when null
     *
     * @return String The converted text, or $string untouched when no charset is known
     */
    function getUtf8String($string,$charset=null) {
        if ($charset == null) {
            $charset = mb_detect_encoding($string);
        }
        if ($charset) {
            return mb_convert_encoding($string, 'UTF-8', $charset);
        }
        return $string;
    }

    /**
     * Convert structure body to utf8 if charset defined in structure headers
     *
     * @param Object $structure Part of a Mime message
     *
     * @return String The body converted by getUtf8String(), '' when the part has no body
     */
    function getUtf8Body($structure) {
        $charset = null;
        if (isset($structure->headers["content-type"]) && isset($structure->ctype_parameters['charset'])) {
            $charset = $structure->ctype_parameters['charset'];
        }
        if (!isset($structure->body)) {
            return '';
        }
        return $this->getUtf8String($structure->body, $charset);
    }

    /**
     * Return the raw content-type header of a Mime part.
     *
     * @param Object $struct Part of a Mime message
     *
     * @return String The 'content-type' header, "" when the part has none
     */
    private function getContentType($struct) {
        if (isset($struct->headers["content-type"])) {
            return $struct->headers["content-type"];
        }
        return "";
    }

    /**
     * Extract from given structure the content and store it as an attachment of the given message
     *
     * Nothing is stored when the part has no body or a blank one.
     *
     * @param Integer             $messageId   Message id
     * @param Object              $struct      Subpart of a Mime message to treat
     * @param Object              $mailHeaders Headers of the message (not the subpart)
     * @param ForumML_FileStorage $storage     Object that manage the file storage on FS
     */
    function storePart($messageId, $struct, $mailHeaders, $storage) {
        if (!isset($struct->body) || trim($struct->body) == "") {
            return;
        }

        $filetype = $this->getContentType($struct);
        if ($struct->ctype_primary == 'text' && $struct->ctype_secondary == 'html') {
            // name the HTML version after the part of the message-id located
            // between its first character and the '@'
            $messageIdHeader = $mailHeaders["message-id"];
            $filename = "message_".substr($messageIdHeader, 1, strpos($messageIdHeader, '@') - 1).".html";
        } elseif (isset($struct->d_parameters["filename"])) {
            $filename = $struct->d_parameters["filename"];
        } else {
            // special case where a content is attached, without filename
            $pos = strpos($filetype, "name=");
            if ($pos === false) {
                // no name available at all: use the generic 'attachment'
                $filename = "attachment";
            } else {
                // get filename from 'name' section: skip 'name=' plus one
                // character and drop the last character of the header
                $filename = substr(substr($filetype, $pos), 6, -1);
            }
        }
        // keep only the last path component of the name found in the mail
        $basename = basename($filename);

        // For multipart/related emails
        $content_id = '';
        if (isset($struct->headers['content-id'])) {
            $content_id = $struct->headers['content-id'];
        }

        // store attachment in /var/lib/codendi/forumml/<listname>/<Y_M_D>
        $date  = date("Y_m_d", strtotime($mailHeaders["date"]));
        $fpath = $storage->store($basename, $struct->body, $this->id_list, $date);

        // insert attachment in the DB
        $this->insertAttachment($messageId, $basename, $filetype, $fpath, $content_id);
    }

    /**
     * Parse recursively Mime message to create the message and its attachments in DB
     *
     * A MIME message is a hierarchical organization that may be very
     * simple for a text message (just one structure with headers and
     * a text body) to a very complex HTML mail with inline images,
     * attachments sent in Text+HTML.
     *
     * The main challenge of this method is to find the "root" of the
     * MIME message to store it as a message in the DB, all the other
     * stuff will be attached to this message as an attachment.
     *
     * The root message can be either:
     * - The text version of the message. This applies for
     *   -> mail in plain text (with or without attachments)
     *   -> mail in HTML sent in Text+HTML
     * - If no text version available:
     *   -> if there is an HTML version of the mail, we store it
     *      (happens with mail sent in HTML only).
     *   -> if there is no HTML, we store an empty body.
     *
     * How do we detect the root message:
     * -> We crawl the hierarchy and we take the first text/plain or
     *    text/html part.
     * -> Otherwise, if we are about to store an attachment (an
     *    attachment is everything but first text/plain or first
     *    text/html) we create an empty message.
     *
     * @see http://en.wikipedia.org/wiki/MIME
     *
     * @param Object              $struct      Subpart of a Mime message to treat
     * @param Object              $mailHeaders Headers of the message (not the subpart)
     * @param ForumML_FileStorage $storage     Object that manage the file storage on FS
     * @param Integer             $messageId   Message id
     *
     * @return mixed Id of the message the parts are attached to
     */
    function storeMime($struct, $mailHeaders, $storage, $messageId=0) {
        if ($struct->ctype_primary == 'multipart') {
            // container: treat every sub part, carrying along the message id
            // as soon as one of them created the message
            if (!empty($struct->parts)) {
                foreach ($struct->parts as $part) {
                    $messageId = $this->storeMime($part, $mailHeaders, $storage, $messageId);
                }
            }
            return $messageId;
        }

        $isTextBody = $struct->ctype_primary == 'text'
            && ($struct->ctype_secondary == 'html' || $struct->ctype_secondary == 'plain');

        $inserted = false;
        if ($isTextBody && $messageId == null) {
            // first text/plain or text/html part: this is the root message
            $body      = $this->getUtf8Body($struct);
            $messageId = $this->insertMessage($mailHeaders, $body, $this->getContentType($struct));
            $inserted  = true;
        }

        if ($messageId == 0) {
            // about to store an attachment but no message yet: create an empty one
            $messageId = $this->insertMessage($mailHeaders, "", $this->getContentType($struct));
        }

        if (!$inserted) {
            // everything that was not used as the message body is an attachment
            $this->storePart($messageId, $struct, $mailHeaders, $storage);
        }
        return $messageId;
    }

    /**
     * Abandon all hope you who enter here! Mail & MIME is at best a nightmare, take a couple of
     * bottles before diving into this code...
     * http://en.wikipedia.org/wiki/MIME
     *
     * List (not comprehensive) of email possibilities
     * Text                                                         text/plain
     * -> pure_text.mbox
     * Text + attached files                                        multipart/mixed (text/plain, other/mime)
     * -> text_plus_attachment.mbox
     * HTML (sent in Text + HTML)                                   multipart/alternative (text/plain, text/html)
     * -> pure_html_text_plus_html.mbox
     * HTML (sent in HTML)                                          text/html
     * -> pure_html_in_html_only.mbox
     * HTML + inline image (sent in Text + HTML)                    multipart/alternative(text/plain, multipart/related(text/html, image/png))
     * -> html_with_inline_content_in_text_plus_html.mbox
     * HTML + inline image (sent in HTML)                           multipart/related(text/html, image/png)
     * -> html_with_inline_content_in_html_only.mbox
     * HTML + attached file (sent in Text + HTML)                   multipart/mixed(multipart/alternative(text/plain, text/html), other/mime))
     * HTML + attached file (sent in HTML)                          multipart/mixed(text/html, other/mime)
     * HTML + inline image + attached file (sent in Text + HTML)    multipart/mixed(multipart/alternative(text/plain, multipart/related(text/html, image/png)), other/mime)
     * -> html_with_inline_content_and_attch_in_text_plus_html.mbox
     * HTML + inline image + attached file (sent in HTML)           multipart/mixed(multipart/related(text/html, image/png), other/mime)
     * -> html_with_inline_content_and_attch_in_html_only.mbox
     *
     * @param Object              $email   Decoded Mime message; its 'headers' are used as the mail headers
     * @param ForumML_FileStorage $storage Object that manage the file storage on FS
     *
     * @return mixed Id of the stored message, as returned by storeMime()
     */
    public function storeEmail($email, $storage) {
        return $this->storeMime($email, $email->headers, $storage);
    }
}