2 source-file.cc -- implement Source_file
4 source file of the GNU LilyPond music typesetter
6 (c) 1997--2005 Jan Nieuwenhuizen <janneke@gnu.org>
7 Han-Wen Nienhuys <hanwen@cs.uu.nl>
10 #include "source-file.hh"
15 #include <utf8/wchar.h> /* wcrtomb */
17 #include <wchar.h> /* wcrtomb */
26 #define istringstream(x) istrstream (x, length ())
30 #include "file-name-map.hh"
// Fill the source buffer from standard input.
// NOTE(review): this excerpt omits some lines of the definition; the
// comments below describe only what is visible.
33 Source_file::load_stdin ()
// Growable buffer that collects the incoming characters.
38 Array<char> chs; // ugh.
// Read stdin one character at a time until end of file.
39 while ((c = fgetc (stdin)) != EOF)
// The element count of the buffer becomes the recorded length.
43 length_ = chs.size ();
// The array handed out by remove_array () becomes the contents pointer;
// the destructor later releases contents_str0_ with delete[].
44 contents_str0_ = chs.remove_array ();
48 gulp_file (String filename, int *filesize)
50 /* "b" must ensure to open literally, avoiding text (CR/LF)
52 FILE *f = fopen (filename.to_str0 (), "rb");
55 warning (_f ("can't open file: `%s'", filename.to_str0 ()));
59 fseek (f, 0, SEEK_END);
60 *filesize = ftell (f);
63 char *str = new char[*filesize + 1];
66 int bytes_read = fread (str, sizeof (char), *filesize, f);
67 if (bytes_read != *filesize)
68 warning (_f ("expected to read %d characters, got %d", bytes_read,
// Construct a source file whose contents come from the in-memory string
// DATA.  NOTE(review): what is done with FILENAME is not visible in this
// excerpt.
75 Source_file::Source_file (String filename, String data)
// Take the text from DATA (presumably a private copy, given the name
// get_copy_str0 -- confirm) and remember its length.
79 contents_str0_ = data.get_copy_str0 ();
80 length_ = data.length ();
// The read position starts at the beginning of the buffer.
81 pos_str0_ = to_str0 ();
// Record the address of every newline byte; get_line () searches this
// table.
84 for (int i = 0; i < length_; i++)
85 if (contents_str0_[i] == '\n')
86 newline_locations_.push (contents_str0_ + i);
// Construct a source file by loading FILENAME_STRING.
// NOTE(review): some lines of this definition are missing from the
// excerpt; the comments describe only what is visible.
89 Source_file::Source_file (String filename_string)
91 name_ = filename_string;
// The name "-" is tested separately from regular file names; the
// statement it guards is not visible here (presumably load_stdin () --
// confirm).
95 if (filename_string == "-")
// gulp_file () returns the buffer and stores its size in length_.
98 contents_str0_ = gulp_file (filename_string, &length_);
// The read position starts at the beginning of the buffer.
100 pos_str0_ = to_str0 ();
// Record the address of every newline byte; get_line () searches this
// table.
104 for (int i = 0; i < length_; i++)
105 if (contents_str0_[i] == '\n')
106 newline_locations_.push (contents_str0_ + i);
// Create a Scheme string port over the file contents and label it with
// the file name.
110 Source_file::init_port ()
// The contents are handed over as a 0-terminated C string.
112 SCM str = scm_makfrom0str (contents_str0_);
// The port is opened for reading (SCM_OPN | SCM_RDNG) and kept in
// str_port_.
113 str_port_ = scm_mkstrport (SCM_INUM0, str, SCM_OPN | SCM_RDNG, __FUNCTION__);
// Attach name_ to the port as its file name.
114 scm_set_port_filename_x (str_port_, scm_makfrom0str (name_.get_str0 ()));
// Report the current read position as an offset from the start of the
// contents buffer.
118 Source_file::tell () const
120 return pos_str0_ - contents_str0_;
// Set up istream_ as an input stream over the file contents.
// NOTE(review): the surrounding conditions and the return statement are
// not visible in this excerpt.
124 Source_file::get_istream ()
// Non-empty buffer: stream over the contents.  When the istringstream
// macro defined near the top of the file is active, this expands to an
// istrstream over to_str0 () with length () bytes.
128 if (length ()) // can't this be done without such a hack?
129 istream_ = new std::istringstream (to_str0 ());
// Otherwise an empty stream is created and flagged as being at end of
// file.
132 istream_ = new std::istringstream ("");
133 istream_->setstate (std::ios::eofbit);
134 // istream_->set (ios::eofbit);
// Format the location of CONTEXT_STR0 as "NAME:LINE:COLUMN".
141 Source_file::file_line_column_string (char const *context_str0) const
// Fallback text for a position that cannot be located; the condition
// guarding it is not visible in this excerpt (error_string () uses
// !contains () for the same message).
144 return " (" + _ ("position unknown") + ")";
// Normal case: mapped file name, then line and column from get_line ()
// and get_column ().
146 return name_string () + ":" + to_string (get_line (context_str0))
147 + ":" + to_string (get_column (context_str0));
// Return the file name after passing name_ through map_file_name ().
151 Source_file::name_string () const
153 return map_file_name (name_);
// Destructor.  NOTE(review): only the release of the contents buffer is
// visible in this excerpt.
156 Source_file::~Source_file ()
// The contents buffer is an array allocation, hence delete[].
160 delete[] contents_str0_;
// Compute the span of the line around POS_STR0 as a Slice of offsets
// into the contents buffer.
// NOTE(review): several lines of this definition (early returns, loop
// bodies) are missing from the excerpt.
164 Source_file::line_slice (char const *pos_str0) const
// Positions outside the buffer are handled first; the value returned for
// them is not visible here.
166 if (!contains (pos_str0))
169 char const *data_str0 = to_str0 ();
// One past the last byte of the buffer.
170 char const *eof_C_ = data_str0 + length ();
// POS_STR0 sitting exactly at the end of the buffer is special-cased
// (handling not visible here).
172 if (pos_str0 == eof_C_)
// Scan backwards from POS_STR0, testing each preceding byte for a
// newline.
174 char const *begin_str0 = pos_str0;
175 while (begin_str0 > data_str0)
176 if (*--begin_str0 == '\n')
// Scan forwards from POS_STR0, testing each byte for a newline.
182 char const* end_str0 = pos_str0;
183 while (end_str0 < eof_C_)
184 if (*end_str0++ == '\n')
// Both bounds are returned relative to the start of the buffer.
190 return Slice (begin_str0 - data_str0, end_str0 - data_str0);
// Return the text of the line around POS_STR0 as a String.
194 Source_file::line_string (char const* pos_str0) const
// Positions outside the buffer are handled first; the value returned for
// them is not visible in this excerpt.
196 if (!contains (pos_str0))
// Copy line.length () bytes starting at the left bound reported by
// line_slice ().
199 Slice line = line_slice (pos_str0);
200 char const *data_str0 = to_str0 ();
201 return String ((Byte const *)data_str0 + line[LEFT], line.length ());
// Return how far POS_STR0 lies from the lower bound of its line slice.
// This is plain pointer arithmetic; get_column () is the variant that
// decodes multibyte characters and tabs.
205 Source_file::get_char_of_line (char const *pos_str0) const
// Positions outside the buffer are handled first; the value returned for
// them is not visible in this excerpt.
207 if (!contains (pos_str0))
210 char const *data_str0 = to_str0 ();
// The lower bound of the slice, added to the buffer start, is the
// reference address for the subtraction.
211 return pos_str0 - (line_slice (pos_str0)[SMALLER] + data_str0);
215 Source_file::get_column (char const *pos_str0) const
217 if (!contains (pos_str0))
220 Slice line = line_slice (pos_str0);
221 char const *data = to_str0 ();
222 Byte const *line_start = (Byte const *)data + line[LEFT];
224 int left = (Byte const*) pos_str0 - line_start;
225 String line_begin (line_start, left);
226 char const *line_chars = line_begin.to_str0();
231 /* Initialize the state. */
232 memset (&state, '\0', sizeof (state));
236 wchar_t multibyte[2];
237 size_t thislen = mbrtowc (multibyte, line_chars, left, &state);
239 /* Stop converting at invalid character;
240 this can mean we have read just the first part
241 of a valid character. */
242 if (thislen == (size_t) -1)
244 /* We want to handle embedded NUL bytes
245 but the return value is 0. Correct this. */
249 if (thislen == 1 && line_chars[0] == '\t')
250 column = (column / 8 + 1) * 8;
254 /* Advance past this character. */
255 line_chars += thislen;
// Build a context string for diagnostics about POS_STR0.
// NOTE(review): part of the concatenation and the return statement are
// missing from this excerpt.
263 Source_file::error_string (char const* pos_str0) const
// Positions outside the buffer get a fixed "position unknown" text.
265 if (!contains (pos_str0))
266 return " (" + _ ("position unknown") + ")";
// Offset of POS_STR0 within its line, and the text of that line.
268 int ch_i = get_char_of_line (pos_str0);
269 String line = line_string (pos_str0);
// The line is split at POS_STR0: the text before it, then padding built
// from ' ' and get_column () (presumably that many spaces -- confirm),
// then the remainder of the line.
270 String context = line.left_string (ch_i)
272 + to_string (' ', get_column (pos_str0))
273 + line.cut_string (ch_i, INT_MAX);
// Tell whether POS_STR0 is non-null and lies within the contents buffer.
// The upper bound is inclusive: the address one past the last byte
// (to_str0 () + length ()) is accepted as well.
279 Source_file::contains (char const* pos_str0) const
281 return (pos_str0 && (pos_str0 >= to_str0 ()) && (pos_str0 <= to_str0 () + length ()));
// Map POS_STR0 to a line number using the table of newline addresses
// filled in by the constructors.
// NOTE(review): the returned values and several statements are missing
// from this excerpt; the comments describe only the visible tests.
285 Source_file::get_line (char const* pos_str0) const
// Positions outside the buffer are handled first.
287 if (!contains (pos_str0))
// No newline was recorded for this buffer.
290 if (!newline_locations_.size ())
294 int hi = newline_locations_.size ();
// Shortcut: POS_STR0 lies before the newline at index lo.
296 if (newline_locations_[lo] > pos_str0)
// Shortcut: POS_STR0 lies after the last recorded newline.
299 if (newline_locations_[hi-1] < pos_str0)
// General case: narrow the bounds by searching the newline addresses.
302 binary_search_bounds (newline_locations_,
304 Link_array<char>::default_compare,
// A position that points at a newline character itself is treated
// specially (the adjustment is not visible here).
307 if (*pos_str0 == '\n')
// Size of the contents buffer; contains () uses to_str0 () + length ()
// as the end of the buffer.  NOTE(review): the body is not visible in
// this excerpt (presumably it returns length_ -- confirm).
313 Source_file::length () const
// Return the start of the contents buffer.
319 Source_file::to_str0 () const
321 return contents_str0_;
// Set the current read position to POS_STR0.
325 Source_file::set_pos (char const * pos_str0)
// Only positions inside the buffer are accepted.
327 if (contains (pos_str0))
328 pos_str0_ = pos_str0;
// Any other position is reported through error () (the else keyword is
// not visible in this excerpt).
330 error (error_string (pos_str0) + "invalid pos");
// Move the current read position to offset N in the buffer.
// NOTE(review): the return statement is not visible in this excerpt.
334 Source_file::seek_str0 (int n)
336 char const *new_str0 = to_str0 () + n;
// NOTE(review): the condition guarding this adjustment is missing from
// the excerpt; adding length () would turn a negative N into an offset
// from the end of the buffer -- confirm.
338 new_str0 += length ();
// Only targets inside the buffer are accepted; anything else is reported
// through error ().
339 if (contains (new_str0))
340 pos_str0_ = new_str0;
342 error (error_string (new_str0) + "seek past eof");
// Advance the current read position by N bytes.
// NOTE(review): the return statement is not visible in this excerpt;
// get_string () passes the result to the String constructor as the
// start of the text, so presumably the previous position is returned --
// confirm.
348 Source_file::forward_str0 (int n)
// Remember where the position was before moving.
350 char const *old_pos = pos_str0_;
351 char const *new_str0 = pos_str0_ + n;
// Only targets inside the buffer are accepted; anything else is reported
// through error ().
352 if (contains (new_str0))
353 pos_str0_ = new_str0;
355 error (error_string (new_str0) + "forward past eof");
361 Source_file::get_string (int n)
363 String str = String ((Byte const *)forward_str0 (n), n);