Commit caef7872 by Francois-Xavier Coudert Committed by François-Xavier Coudert

re PR fortran/31645 (Error on reading Byte Order Mark)

	PR fortran/31645

	* scanner.c (load_file): Discard the byte order mark if one is
	found on the first non-preprocessor line of a file.

	* testsuite/gfortran.dg/bom_error.f90: New test.
	* testsuite/gfortran.dg/bom_include.f90: New test.
	* testsuite/gfortran.dg/bom_UTF16-LE.f90: New test.
	* testsuite/gfortran.dg/bom_UTF16-BE.f90: New test.
	* testsuite/gfortran.dg/bom_UTF-8.f90: New test.
	* testsuite/gfortran.dg/bom_UTF-32.f90: New test.
	* testsuite/gfortran.dg/bom_UTF-8.F90: New test.
	* testsuite/gfortran.dg/bom_include.inc: New file.

From-SVN: r124274
parent 70ec16f7
2007-04-29 Francois-Xavier Coudert <fxcoudert@gcc.gnu.org>
PR fortran/31645
* scanner.c (load_file): Discard the byte order mark if one is
found on the first non-preprocessor line of a file.
2007-04-29 Paul Thomas <pault@gcc.gnu.org>
PR fortran/31711
......
......@@ -1404,6 +1404,7 @@ load_file (const char *filename, bool initial)
gfc_file *f;
FILE *input;
int len, line_len;
bool first_line;
for (f = current_file; f; f = f->up)
if (strcmp (filename, f->filename) == 0)
......@@ -1445,6 +1446,7 @@ load_file (const char *filename, bool initial)
current_file->line = 1;
line = NULL;
line_len = 0;
first_line = true;
if (initial && gfc_src_preprocessor_lines[0])
{
......@@ -1467,6 +1469,26 @@ load_file (const char *filename, bool initial)
if (feof (input) && len == 0)
break;
/* If this is the first line of the file, it can contain a byte
order mark (BOM), which we will ignore:
FF FE is UTF-16 little endian,
FE FF is UTF-16 big endian,
EF BB BF is UTF-8. */
if (first_line
&& ((line_len >= 2 && line[0] == '\xFF' && line[1] == '\xFE')
|| (line_len >= 2 && line[0] == '\xFE' && line[1] == '\xFF')
|| (line_len >= 3 && line[0] == '\xEF' && line[1] == '\xBB'
&& line[2] == '\xBF')))
{
int n = line[1] == '\xBB' ? 3 : 2;
char * new = gfc_getmem (line_len);
strcpy (new, line + n);
gfc_free (line);
line = new;
len -= n;
}
/* There are three things this line can be: a line of Fortran
source, an include line or a C preprocessor directive. */
......@@ -1476,6 +1498,11 @@ load_file (const char *filename, bool initial)
continue;
}
/* Preprocessed files have preprocessor lines added before the byte
order mark, so first_line is not about the first line of the file
but the first line that's not a preprocessor line. */
first_line = false;
if (include_line (line))
{
current_file->line++;
......
2007-04-29 Francois-Xavier Coudert <fxcoudert@gcc.gnu.org>
PR fortran/31645
* testsuite/gfortran.dg/bom_error.f90: New test.
* testsuite/gfortran.dg/bom_include.f90: New test.
* testsuite/gfortran.dg/bom_UTF16-LE.f90: New test.
* testsuite/gfortran.dg/bom_UTF16-BE.f90: New test.
* testsuite/gfortran.dg/bom_UTF-8.f90: New test.
* testsuite/gfortran.dg/bom_UTF-32.f90: New test.
* testsuite/gfortran.dg/bom_UTF-8.F90: New test.
* testsuite/gfortran.dg/bom_include.inc: New file.
2007-04-28 Andrew Pinski <andrew_pinski@playstation.sony.com>
PR C++/30221
print *, "Hello world"
end
! { dg-do compile }
print *, "Hello world"
end
! { dg-do compile }
! { dg-do compile }
include "bom_include.inc"
print *, "Hello world!"
end
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment