binutils-gdb/gdb/testsuite/gdb.base/charset.c
Tiezhu Yang e31cf164b4 gdb: testsuite: make string[] type as char in gdb.base/charset.c
This reverts the commit ff656e2e1c ("gdb: testsuite: fix failed
testcases in gdb.base/charset.exp").

The original test code has no problem. On an architecture where
char is signed, then both 'A' and ebcdic_us_string[7] will yield
-63, which makes the equality true. On an architecture where char
is unsigned, then both 'A' and ebcdic_us_string[7] will yield 193,
which also makes the equality true.

The test cases only failed on LoongArch. The default type of char
is signed char on LoongArch, like x86-64. But when use gdb print
command on LoongArch, the default type of char is unsigned char,
this is wrong, I will look into it later, sorry for that.

On LoongArch:

  $ cat test_char.c
  #include <stdio.h>

  int main()
  {
          char c1 = 193;
          unsigned char c2 = 193;

          printf("%d\n", c1);
          printf("%d\n", c1 == c2);

          return 0;
  }
  $ gcc test_char.c -o test_char
  $ ./test_char
  -63
  0

  (gdb) set target-charset EBCDIC-US
  (gdb) print 'A'
  $1 = 193 'A'
  (gdb) print /c 'A'
  $2 = 193 'A'
  (gdb) print /u 'A'
  $3 = 193
  (gdb) print /d 'A'
  $4 = -63
  (gdb) print /x 'A'
  $5 = 0xc1

Signed-off-by: Tiezhu Yang <yangtiezhu@loongson.cn>
2022-01-13 11:12:55 +08:00

203 lines
5.7 KiB
C

/* This testcase is part of GDB, the GNU debugger.
Copyright 2001-2022 Free Software Foundation, Inc.
Contributed by Red Hat, originally written by Jim Blandy.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>.
Please email any bugs, comments, and/or additions to this file to:
bug-gdb@gnu.org */
/* X_string is a null-terminated string in the X charset whose
elements are as follows. X should be the name the `set charset'
command uses for the character set, in lower-case, with any
non-identifier characters replaced with underscores. Where a
character set doesn't have the given character, the string should
contain the character 'x'.
[0] --- the `alert' character, '\a'
[1] --- the `backspace' character, '\b'
[2] --- the `form feed' character, '\f'
[3] --- the `line feed' character, '\n'
[4] --- the `carriage return' character, '\r'
[5] --- the `horizontal tab' character, '\t'
[6] --- the `vertical tab' character, '\v'
[7 .. 32] --- the uppercase letters A-Z
[33 .. 58] --- the lowercase letters a-z
[59 .. 68] --- the digits 0-9
[69] --- the `cent' character
[70] --- a control character with no defined backslash escape
Feel free to extend these as you like. */
#define NUM_CHARS (71)
char ascii_string[NUM_CHARS];
char iso_8859_1_string[NUM_CHARS];
char ebcdic_us_string[NUM_CHARS];
char ibm1047_string[NUM_CHARS];
#ifndef __cplusplus
/* We make a phony wchar_t and then pretend that this platform uses
UTF-32 (or UTF-16, depending on the size -- same difference for the
purposes of this test). */
typedef unsigned int wchar_t;
/* We also define a couple phony types for testing the u'' and U''
support. It is ok if these have the wrong size on some platforms
-- the test case will skip the tests in that case. */
typedef unsigned short char16_t;
typedef unsigned int char32_t;
#endif
wchar_t utf_32_string[NUM_CHARS];
/* Make sure to use the typedefs. */
char16_t uvar;
char32_t Uvar;
char16_t *String16;
char32_t *String32;
/* A typedef to a typedef should also work. */
typedef wchar_t my_wchar_t;
my_wchar_t myvar;
/* Some arrays for simple assignment tests. */
short short_array[3];
int int_array[3];
long long_array[3];
/* These are unsigned char so we can pass down characters >127 without
explicit casts or warnings. */
void
init_string (char string[],
unsigned char x,
unsigned char alert,
unsigned char backspace,
unsigned char form_feed,
unsigned char line_feed,
unsigned char carriage_return,
unsigned char horizontal_tab,
unsigned char vertical_tab,
unsigned char cent,
unsigned char misc_ctrl)
{
int i;
for (i = 0; i < NUM_CHARS; ++i)
string[i] = x;
string[0] = alert;
string[1] = backspace;
string[2] = form_feed;
string[3] = line_feed;
string[4] = carriage_return;
string[5] = horizontal_tab;
string[6] = vertical_tab;
string[69] = cent;
string[70] = misc_ctrl;
}
void
fill_run (char string[], int start, int len, int first)
{
int i;
for (i = 0; i < len; i++)
string[start + i] = first + i;
}
void
init_utf32 ()
{
int i;
for (i = 0; i < NUM_CHARS; ++i)
utf_32_string[i] = iso_8859_1_string[i] & 0xff;
}
extern void malloc_stub (void);
int main ()
{
malloc_stub ();
/* Initialize ascii_string. */
init_string (ascii_string,
120,
7, 8, 12,
10, 13, 9,
11, 120, 17);
fill_run (ascii_string, 7, 26, 65);
fill_run (ascii_string, 33, 26, 97);
fill_run (ascii_string, 59, 10, 48);
/* Initialize iso_8859_1_string. */
init_string (iso_8859_1_string,
120,
7, 8, 12,
10, 13, 9,
11, 162, 17);
fill_run (iso_8859_1_string, 7, 26, 65);
fill_run (iso_8859_1_string, 33, 26, 97);
fill_run (iso_8859_1_string, 59, 10, 48);
/* Initialize ebcdic_us_string. */
init_string (ebcdic_us_string,
167,
47, 22, 12,
37, 13, 5,
11, 74, 17);
/* In EBCDIC, the upper-case letters are broken into three separate runs. */
fill_run (ebcdic_us_string, 7, 9, 193);
fill_run (ebcdic_us_string, 16, 9, 209);
fill_run (ebcdic_us_string, 25, 8, 226);
/* The lower-case letters are, too. */
fill_run (ebcdic_us_string, 33, 9, 129);
fill_run (ebcdic_us_string, 42, 9, 145);
fill_run (ebcdic_us_string, 51, 8, 162);
/* The digits, at least, are contiguous. */
fill_run (ebcdic_us_string, 59, 10, 240);
/* Initialize ibm1047_string. */
init_string (ibm1047_string,
167,
47, 22, 12,
37, 13, 5,
11, 74, 17);
/* In IBM1047, the upper-case letters are broken into three separate runs. */
fill_run (ibm1047_string, 7, 9, 193);
fill_run (ibm1047_string, 16, 9, 209);
fill_run (ibm1047_string, 25, 8, 226);
/* The lower-case letters are, too. */
fill_run (ibm1047_string, 33, 9, 129);
fill_run (ibm1047_string, 42, 9, 145);
fill_run (ibm1047_string, 51, 8, 162);
/* The digits, at least, are contiguous. */
fill_run (ibm1047_string, 59, 10, 240);
init_utf32 ();
myvar = utf_32_string[7];
return 0; /* all strings initialized */
}