2 source-file.cc -- implement Source_file
4 source file of the GNU LilyPond music typesetter
6 (c) 1997--2006 Jan Nieuwenhuizen <janneke@gnu.org>
7 Han-Wen Nienhuys <hanwen@xs4all.nl>
10 #include "source-file.hh"
15 #include <utf8/wchar.h> /* mbrtowc */
17 #include <cwchar> /* mbrtowc */
// Compatibility shim: rewrites istringstream (x) into an istrstream built
// from x and length (), so the expansion only works where length () is in
// scope.  NOTE(review): presumably wrapped in a preprocessor conditional whose
// lines are not visible in this excerpt -- confirm.
26 #define istringstream(x) istrstream (x, length ())
30 #include "file-name-map.hh"
31 #include "international.hh"
// Fill characters_ from standard input: read one character at a time with
// fgetc () until EOF, appending each to characters_, then append a 0 byte.
35 Source_file::load_stdin ()
39 while ((c = fgetc (stdin)) != EOF)
40 characters_.push_back (c);
// Trailing 0 terminator; note that it is counted by characters_.size ().
42 characters_.push_back (0);
// Read the file FILENAME in binary mode and copy its bytes into cxx_arr.
// The size is found by seeking to the end and calling ftell (); read_count
// may then be capped to DESIRED_SIZE via min ().  The condition guarding that
// cap is not visible in this excerpt (the file constructor passes -1).
// A warning is issued when the file cannot be opened and when fewer bytes
// than requested were read.
46 gulp_file (string filename, int desired_size)
48 /* "b" must ensure to open literally, avoiding text (CR/LF)
50 FILE *f = fopen (filename.c_str (), "rb");
53 warning (_f ("can't open file: `%s'", filename.c_str ()));
59 fseek (f, 0, SEEK_END);
// NOTE(review): ftell () returns long and signals failure with -1; the value
// is narrowed to int here and no error check is visible -- confirm.
60 int real_size = ftell (f);
61 int read_count = real_size;
64 read_count = min (read_count, desired_size);
// One extra byte is allocated beyond read_count.
// NOTE(review): the matching delete[] for str and the fclose (f) are not
// visible in this excerpt -- confirm both exist on every path.
68 char *str = new char[read_count + 1];
71 int bytes_read = fread (str, sizeof (char), read_count, f);
72 if (bytes_read != read_count)
// NOTE(review): the message reads "expected ..., got ...", yet bytes_read (the
// actual count) is passed first; the arguments look swapped.  The continuation
// line is not visible here -- confirm and swap if so.
73 warning (_f ("expected to read %d characters, got %d", bytes_read,
// Only the bytes actually read are copied into the result.
76 int filesize = bytes_read;
79 cxx_arr.resize (filesize);
// NOTE(review): when filesize is 0 the vector is empty and &cxx_arr[0] indexes
// an empty vector -- confirm whether an empty-file guard is needed.
81 /* ugh, how to do neatly in STL? */
82 memcpy (&cxx_arr[0], str, filesize);
// Return a pointer to the first element of characters_ (the same expression
// that c_str () returns).
89 Source_file::contents_str0 () const
91 return &characters_[0];
// Construct a Source_file from in-memory DATA: size characters_ to
// data.length (), copy the bytes in, then record the address of every
// newline character in newline_locations_.
// NOTE(review): how FILENAME is stored is not visible in this excerpt.
104 Source_file::Source_file (string filename, string data)
110 characters_.resize (data.length ());
112 /* ugh, how to do neatly in STL? */
113 memcpy ((&characters_[0]), data.c_str (), data.length ());
// newline_locations_ holds raw pointers into characters_; they stay valid only
// as long as characters_ is not resized afterwards.
117 for (vsize i = 0; i < characters_.size (); i++)
118 if (characters_[i] == '\n')
119 newline_locations_.push_back (&characters_[0] + i);
// Construct a Source_file by name: remember the name in name_, load the
// contents, then record the address of every newline in newline_locations_.
122 Source_file::Source_file (string filename_string)
126 name_ = filename_string;
// The name "-" is special-cased; the branch body is not visible in this
// excerpt (presumably it reads standard input via load_stdin () -- confirm).
128 if (filename_string == "-")
// Otherwise read the whole file (desired_size -1) and append a 0 terminator.
132 characters_ = gulp_file (filename_string, -1);
133 characters_.push_back (0);
// Index newlines after loading so the stored pointers refer to the final
// characters_ storage.
138 for (vsize i = 0; i < characters_.size (); i++)
139 if (characters_[i] == '\n')
140 newline_locations_.push_back (&characters_[0] + i);
// Create the Scheme string port str_port_ over the file contents: build an
// SCM string from contents_str0 (), open a port on it with the flags
// SCM_OPN | SCM_RDNG, and set the port's file name to name_.
144 Source_file::init_port ()
146 SCM str = scm_makfrom0str (contents_str0 ());
147 str_port_ = scm_mkstrport (SCM_INUM0, str, SCM_OPN | SCM_RDNG, __FUNCTION__);
148 scm_set_port_filename_x (str_port_, scm_makfrom0str (name_.c_str ()));
// Create the input stream istream_ over the file contents.  With a non-zero
// length () the stream is built from c_str (); the other visible path builds
// it from "" and sets eofbit on it.
// NOTE(review): the surrounding conditions and the return statement are not
// visible in this excerpt; istream_ is allocated with new here, so confirm
// where it is released.
153 Source_file::get_istream ()
157 if (length ()) // can't this be done without such a hack?
158 istream_ = new istringstream (c_str ());
161 istream_ = new istringstream ("");
162 istream_->setstate (ios::eofbit);
163 // istream_->set (ios::eofbit);
// Format the location of CONTEXT_STR0 as name_string () + ":" + line + ":" +
// column, using the counts filled in by get_counts ().
// One path returns the translated " (position unknown)" text instead; its
// guard condition is not visible in this excerpt.
170 Source_file::file_line_column_string (char const *context_str0) const
173 return " (" + _ ("position unknown") + ")";
177 get_counts (context_str0, &l, &ch, &col);
// Only the line and column counts appear in the result; ch is not used here.
179 return name_string () + ":" + to_string (l)
180 + ":" + to_string (col);
// Build a quotation of the source line containing POS_STR0, split at the
// position.  Returns the translated " (position unknown)" text when POS_STR0
// does not lie inside this file's buffer.
185 Source_file::quote_input (char const *pos_str0) const
187 if (!contains (pos_str0))
188 return " (" + _ ("position unknown") + ")";
191 get_counts (pos_str0, &l, &ch, &col);
192 string line = line_string (pos_str0);
// The context is the line text before offset ch, then to_string (' ', col)
// (presumably col spaces -- confirm), then the rest of the line from ch on.
// One operand of this concatenation is on a line not visible in this excerpt.
193 string context = line.substr (0, ch)
195 + to_string (' ', col)
196 + line.substr (ch, line.length()-ch);
// Return the file name after passing name_ through map_file_name ().
201 Source_file::name_string () const
203 return map_file_name (name_);
// Destructor.  NOTE(review): the body is not visible in this excerpt;
// get_istream () allocates istream_ with new, so confirm it is released here.
206 Source_file::~Source_file ()
// Return a Slice of offsets, relative to c_str (), delimiting the line that
// contains POS_STR0.  Scans backwards from the position towards the buffer
// start and forwards towards the buffer end, each time looking for '\n'.
// NOTE(review): the early returns and the loop bodies (how each scan stops and
// whether the newline itself is included) are not visible in this excerpt.
213 Source_file::line_slice (char const *pos_str0) const
215 if (!contains (pos_str0))
218 char const *data_str0 = c_str ();
// One past the last byte of the buffer, as measured by length ().
219 char const *eof_C_ = data_str0 + length ();
// A position exactly at the end of the buffer is handled separately.
221 if (pos_str0 == eof_C_)
// Backward scan: the pointer is decremented before each character is tested.
223 char const *begin_str0 = pos_str0;
224 while (begin_str0 > data_str0)
225 if (*--begin_str0 == '\n')
// Forward scan: the pointer is advanced after each character is tested.
231 char const *end_str0 = pos_str0;
232 while (end_str0 < eof_C_)
233 if (*end_str0++ == '\n')
239 return Slice (begin_str0 - data_str0, end_str0 - data_str0);
// Return the text of the line containing POS_STR0 as a string: line.length ()
// bytes starting at the left offset given by line_slice ().
// The result for a position outside the buffer is not visible in this excerpt.
243 Source_file::line_string (char const *pos_str0) const
245 if (!contains (pos_str0))
248 Slice line = line_slice (pos_str0);
249 char const *data_str0 = c_str ();
250 return string (data_str0 + line[LEFT], line.length ());
// Compute position counts for POS_STR0 and store them through the output
// pointers: the line number comes from get_line (), and the column is
// accumulated by walking the bytes between the start of the line and POS_STR0
// one multibyte character at a time.
// NOTE(review): the remaining parameters, the loop header, and the updates of
// the character count are on lines not visible in this excerpt.
254 Source_file::get_counts (char const *pos_str0,
263 if (!contains (pos_str0))
266 *line_number = get_line (pos_str0);
268 Slice line = line_slice (pos_str0);
269 char const *data = c_str ();
270 char const *line_start = (char const *)data + line[LEFT];
// Number of bytes from the start of the line up to the position.
272 ssize left = (char const *) pos_str0 - line_start;
// Work on a private copy of the bytes preceding the position.
273 string line_begin (line_start, left);
274 char const *line_chars = line_begin.c_str ();
281 /* Initialize the state. */
282 memset (&state, '\0', sizeof (state));
286 wchar_t multibyte[2];
289 FIXME, this is apparently locale dependent.
// thislen is the byte length of the next multibyte character as reported by
// mbrtowc ().
292 size_t thislen = mbrtowc (multibyte, line_chars, left, &state);
295 #endif /* !HAVE_MBRTOWC */
297 /* Stop converting at invalid character;
298 this can mean we have read just the first part
299 of a valid character. */
300 if (thislen == (size_t) -1)
303 /* We want to handle embedded NUL bytes
304 but the return value is 0. Correct this. */
// A tab advances the column to the next multiple of 8.
308 if (thislen == 1 && line_chars[0] == '\t')
309 (*column) = (*column / 8 + 1) * 8;
314 /* Advance past this character. */
315 line_chars += thislen;
// True when POS_STR0 is non-null and lies within the buffer, i.e. in the
// closed range from c_str () to c_str () + length ().  The one-past-the-end
// address is accepted.
321 Source_file::contains (char const *pos_str0) const
323 return (pos_str0 && (pos_str0 >= c_str ()) && (pos_str0 <= c_str () + length ()));
// Return the line number of POS_STR0, derived from its place among the
// recorded newline addresses in newline_locations_ and shifted by
// line_offset_.
// NOTE(review): the values returned by the early-exit checks below, and the
// statement guarded by the final newline test, are not visible in this
// excerpt.
327 Source_file::get_line (char const *pos_str0) const
329 if (!contains (pos_str0))
// No newline recorded at all.
332 if (!newline_locations_.size ())
336 vsize hi = newline_locations_.size ();
// Position lies before the newline at index lo.
338 if (newline_locations_[lo] > pos_str0)
// Position lies after the last recorded newline.
341 if (newline_locations_[hi - 1] < pos_str0)
// Narrow the search range to the newlines around the position.
344 binary_search_bounds (newline_locations_,
345 (char const*&)pos_str0,
// Special handling when the position itself is a newline character.
349 if (*pos_str0 == '\n')
351 return lo + 2 + line_offset_;
// Renumber lines so that get_line (POS_STR0) reports LINE: line_offset_ is
// shifted by the difference between LINE and the currently reported line.
355 Source_file::set_line (char const *pos_str0, int line)
357 int current_line = get_line (pos_str0);
358 line_offset_ += line - current_line;
// Sanity check that the adjustment took effect.
360 assert (line == get_line (pos_str0));
// Return the number of elements in characters_.  Where a loader appended a
// trailing 0 byte (load_stdin (), the file-name constructor), that byte is
// included in the count.
364 Source_file::length () const
366 return characters_.size ();
// Return a pointer to the first element of characters_.
370 Source_file::c_str () const
372 return &characters_[0];
// Port accessor.  NOTE(review): the body is not visible in this excerpt;
// presumably it returns str_port_ -- confirm.
376 Source_file::get_port () const
381 /****************************************************************/
383 #include "ly-smobs.icc"
// Smob boilerplate for Source_file, generated by the ly-smobs macros; the
// type predicate is registered under the name "ly:source-file?".
// NOTE(review): the exact code these macros expand to is defined outside this
// file.
385 IMPLEMENT_SMOBS(Source_file);
386 IMPLEMENT_DEFAULT_EQUAL_P(Source_file);
387 IMPLEMENT_TYPE_P(Source_file, "ly:source-file?");
// Smob mark hook: recover the Source_file stored in word 1 of the smob cell
// and return its str_port_ (presumably so the collector keeps the port alive
// -- confirm against the Guile smob protocol).
390 Source_file::mark_smob (SCM smob)
392 Source_file *sc = (Source_file *) SCM_CELL_WORD_1 (smob);
394 return sc->str_port_;
// Smob print hook: write "#<Source_file ", the file name name_, and " >" to
// PORT.  The print state argument is unused.
// The return statement is not visible in this excerpt.
399 Source_file::print_smob (SCM smob, SCM port, scm_print_state *)
401 Source_file *sc = (Source_file *) SCM_CELL_WORD_1 (smob);
403 scm_puts ("#<Source_file ", port);
404 scm_puts (sc->name_.c_str (), port);
406 /* Do not print properties, that is too much hassle. */
407 scm_puts (" >", port);