1 /////////////////////////////////////////////////////////////////////////////
2 // Name:        src/html/htmlfilt.cpp
3 // Purpose:     wxHtmlFilter - input filter for translating into HTML format
4 // Author:      Vaclav Slavik
5 // Copyright:   (c) 1999 Vaclav Slavik
6 // Licence:     wxWindows licence
7 /////////////////////////////////////////////////////////////////////////////
8 
9 #include "wx/wxprec.h"
10 
11 #ifdef __BORLANDC__
12     #pragma hdrstop
13 #endif
14 
15 #if wxUSE_HTML && wxUSE_STREAMS
16 
17 #ifndef WX_PRECOMP
18     #include "wx/log.h"
19     #include "wx/intl.h"
20 #endif
21 
22 #include "wx/strconv.h"
23 #include "wx/sstream.h"
24 #include "wx/html/htmlfilt.h"
25 #include "wx/html/htmlwin.h"
26 
27 // utility function: read entire contents of an wxInputStream into a wxString
28 //
29 // TODO: error handling?
ReadString(wxString & str,wxInputStream * s,wxMBConv & conv)30 static void ReadString(wxString& str, wxInputStream* s, wxMBConv& conv)
31 {
32     wxStringOutputStream out(&str, conv);
33     s->Read(out);
34 }
35 
36 /*
37 
38 There is code for several default filters:
39 
40 */
41 
IMPLEMENT_ABSTRACT_CLASS(wxHtmlFilter,wxObject)42 IMPLEMENT_ABSTRACT_CLASS(wxHtmlFilter, wxObject)
43 
44 //--------------------------------------------------------------------------------
45 // wxHtmlFilterPlainText
46 //          filter for text/plain or uknown
47 //--------------------------------------------------------------------------------
48 
49 IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterPlainText, wxHtmlFilter)
50 
51 bool wxHtmlFilterPlainText::CanRead(const wxFSFile& WXUNUSED(file)) const
52 {
53     return true;
54 }
55 
56 
57 
ReadFile(const wxFSFile & file) const58 wxString wxHtmlFilterPlainText::ReadFile(const wxFSFile& file) const
59 {
60     wxInputStream *s = file.GetStream();
61     wxString doc, doc2;
62 
63     if (s == NULL) return wxEmptyString;
64     ReadString(doc, s, wxConvISO8859_1);
65 
66     doc.Replace(wxT("&"), wxT("&"), true);
67     doc.Replace(wxT("<"), wxT("&lt;"), true);
68     doc.Replace(wxT(">"), wxT("&gt;"), true);
69     doc2 = wxT("<HTML><BODY><PRE>\n") + doc + wxT("\n</PRE></BODY></HTML>");
70     return doc2;
71 }
72 
73 
74 
75 
76 
77 //--------------------------------------------------------------------------------
78 // wxHtmlFilterImage
79 //          filter for image/*
80 //--------------------------------------------------------------------------------
81 
82 class wxHtmlFilterImage : public wxHtmlFilter
83 {
84     DECLARE_DYNAMIC_CLASS(wxHtmlFilterImage)
85 
86     public:
87         virtual bool CanRead(const wxFSFile& file) const;
88         virtual wxString ReadFile(const wxFSFile& file) const;
89 };
90 
IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterImage,wxHtmlFilter)91 IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterImage, wxHtmlFilter)
92 
93 
94 
95 bool wxHtmlFilterImage::CanRead(const wxFSFile& file) const
96 {
97     return (file.GetMimeType().Left(6) == wxT("image/"));
98 }
99 
100 
101 
ReadFile(const wxFSFile & file) const102 wxString wxHtmlFilterImage::ReadFile(const wxFSFile& file) const
103 {
104     wxString res = wxT("<HTML><BODY><IMG SRC=\"") + file.GetLocation() + wxT("\"></BODY></HTML>");
105     return res;
106 }
107 
108 
109 
110 
111 //--------------------------------------------------------------------------------
112 // wxHtmlFilterHTML
113 //          filter for text/html
114 //--------------------------------------------------------------------------------
115 
116 
IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterHTML,wxHtmlFilter)117 IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterHTML, wxHtmlFilter)
118 
119 bool wxHtmlFilterHTML::CanRead(const wxFSFile& file) const
120 {
121 //    return (file.GetMimeType() == "text/html");
122 // This is true in most case but some page can return:
123 // "text/html; char-encoding=...."
124 // So we use Find instead
125   return (file.GetMimeType().Find(wxT("text/html")) == 0);
126 }
127 
128 
129 
ReadFile(const wxFSFile & file) const130 wxString wxHtmlFilterHTML::ReadFile(const wxFSFile& file) const
131 {
132     wxInputStream *s = file.GetStream();
133     wxString doc;
134 
135     if (s == NULL)
136     {
137         wxLogError(_("Cannot open HTML document: %s"), file.GetLocation().c_str());
138         return wxEmptyString;
139     }
140 
141     // NB: We convert input file to wchar_t here in Unicode mode, based on
142     //     either Content-Type header or <meta> tags. In ANSI mode, we don't
143     //     do it as it is done by wxHtmlParser (for this reason, we add <meta>
144     //     tag if we used Content-Type header).
145 #if wxUSE_UNICODE
146     int charsetPos;
147     if ((charsetPos = file.GetMimeType().Find(wxT("; charset="))) != wxNOT_FOUND)
148     {
149         wxString charset = file.GetMimeType().Mid(charsetPos + 10);
150         wxCSConv conv(charset);
151         ReadString(doc, s, conv);
152     }
153     else
154     {
155         size_t size = s->GetSize();
156         wxCharBuffer buf( size );
157         s->Read( buf.data(), size );
158         wxString tmpdoc( buf, wxConvISO8859_1);
159 
160         wxString charset = wxHtmlParser::ExtractCharsetInformation(tmpdoc);
161         if (charset.empty())
162             doc = tmpdoc;
163         else
164         {
165             wxCSConv conv(charset);
166             doc = wxString( buf, conv );
167         }
168     }
169 #else // !wxUSE_UNICODE
170     ReadString(doc, s, wxConvLibc);
171     // add meta tag if we obtained this through http:
172     if (!file.GetMimeType().empty())
173     {
174         wxString hdr;
175         wxString mime = file.GetMimeType();
176         hdr.Printf(wxT("<meta http-equiv=\"Content-Type\" content=\"%s\">"), mime.c_str());
177         return hdr+doc;
178     }
179 #endif
180 
181     return doc;
182 }
183 
184 
185 
186 
187 ///// Module:
188 
189 class wxHtmlFilterModule : public wxModule
190 {
191     DECLARE_DYNAMIC_CLASS(wxHtmlFilterModule)
192 
193     public:
OnInit()194         virtual bool OnInit()
195         {
196             wxHtmlWindow::AddFilter(new wxHtmlFilterHTML);
197             wxHtmlWindow::AddFilter(new wxHtmlFilterImage);
198             return true;
199         }
OnExit()200         virtual void OnExit() {}
201 };
202 
203 IMPLEMENT_DYNAMIC_CLASS(wxHtmlFilterModule, wxModule)
204 
205 #endif
206