Skip to content

Commit

Permalink
Add support for collating sequences on indexed files
Browse files Browse the repository at this point in the history
  • Loading branch information
ddeclerck committed Jan 30, 2024
1 parent 824f2a6 commit fab88f5
Show file tree
Hide file tree
Showing 14 changed files with 658 additions and 58 deletions.
6 changes: 6 additions & 0 deletions NEWS
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,9 @@ NEWS - user visible changes -*- outline -*-
the error output for format errors (for example invalid indicator column)
is now limitted to 5 per source file

** support the COLLATING SEQUENCE clause on indexed files
(currently only with the BDB backend)

more work in progress

* Important Bugfixes
Expand All @@ -28,6 +31,9 @@ NEWS - user visible changes -*- outline -*-
build system do not correctly work together to locate files from
diagnostic output

** New option -fdefault-file-colseq to specify the default
file collating sequence

* More notable changes

** execution times were significantly reduced for the following:
Expand Down
13 changes: 13 additions & 0 deletions cobc/ChangeLog
Original file line number Diff line number Diff line change
@@ -1,4 +1,17 @@

2024-01-25 David Declerck <[email protected]>

FR #459: support COLLATING SEQUENCE clause on SELECT / INDEXED files
* codegen.c (output_file_initialization): output the indexed
file/keys collating sequence (were already present in the AST)
* tree.c (validate_indexed_key_field): process postponed
key collating sequences
* parser.y (collating_sequence_clause, collating_sequence_clause_key):
replace CB_PENDING by CB_UNFINISHED on file and key collating sequence
* flag.def, tree.c, tree.h, cobc.c, parser.y: add and handle a new
-fdefault-file-colseq flag to specify the default collating
sequence to use for files without a collating sequence clause

2023-11-29 Fabrice Le Fessant <[email protected]>

* cobc.c (cobc_clean_up): when save-temps specifies a directory,
Expand Down
42 changes: 25 additions & 17 deletions cobc/cobc.c
Original file line number Diff line number Diff line change
Expand Up @@ -90,22 +90,23 @@ enum compile_level {
CB_LEVEL_EXECUTABLE = 7
};

#define CB_FLAG_GETOPT_STACK_SIZE 1
#define CB_FLAG_GETOPT_IF_CUTOFF 2
#define CB_FLAG_GETOPT_SIGN 3
#define CB_FLAG_GETOPT_FOLD_COPY 4
#define CB_FLAG_GETOPT_FOLD_CALL 5
#define CB_FLAG_GETOPT_TTITLE 6
#define CB_FLAG_GETOPT_MAX_ERRORS 7
#define CB_FLAG_GETOPT_DUMP 8
#define CB_FLAG_GETOPT_CALLFH 9
#define CB_FLAG_GETOPT_INTRINSICS 10
#define CB_FLAG_GETOPT_EC 11
#define CB_FLAG_GETOPT_NO_EC 12
#define CB_FLAG_GETOPT_NO_DUMP 13
#define CB_FLAG_GETOPT_EBCDIC_TABLE 14
#define CB_FLAG_GETOPT_DEFAULT_COLSEQ 15
#define CB_FLAG_MEMORY_CHECK 16
#define CB_FLAG_GETOPT_STACK_SIZE 1
#define CB_FLAG_GETOPT_IF_CUTOFF 2
#define CB_FLAG_GETOPT_SIGN 3
#define CB_FLAG_GETOPT_FOLD_COPY 4
#define CB_FLAG_GETOPT_FOLD_CALL 5
#define CB_FLAG_GETOPT_TTITLE 6
#define CB_FLAG_GETOPT_MAX_ERRORS 7
#define CB_FLAG_GETOPT_DUMP 8
#define CB_FLAG_GETOPT_CALLFH 9
#define CB_FLAG_GETOPT_INTRINSICS 10
#define CB_FLAG_GETOPT_EC 11
#define CB_FLAG_GETOPT_NO_EC 12
#define CB_FLAG_GETOPT_NO_DUMP 13
#define CB_FLAG_GETOPT_EBCDIC_TABLE 14
#define CB_FLAG_GETOPT_DEFAULT_COLSEQ 15
#define CB_FLAG_GETOPT_DEFAULT_FILE_COLSEQ 16
#define CB_FLAG_MEMORY_CHECK 17


/* Info display limits */
Expand Down Expand Up @@ -3813,6 +3814,13 @@ process_command_line (const int argc, char **argv)
}
break;

case CB_FLAG_GETOPT_DEFAULT_FILE_COLSEQ: /* 16 */
/* -fdefault-file-colseq=<ASCII/EBCDIC/NATIVE> */
if (cb_deciph_default_file_colseq_name (cob_optarg)) {
cobc_err_exit (COBC_INV_PAR, "-fdefault-file-colseq");
}
break;

case CB_FLAG_GETOPT_FOLD_COPY: /* 4 */
/* -ffold-copy=<UPPER/LOWER> : COPY fold case */
if (!cb_strcasecmp (cob_optarg, "UPPER")) {
Expand Down Expand Up @@ -3892,7 +3900,7 @@ process_command_line (const int argc, char **argv)
}
break;

case CB_FLAG_MEMORY_CHECK: /* 16 */
case CB_FLAG_MEMORY_CHECK: /* 17 */
/* -fmemory-check=<scope> : */
if (!cob_optarg) {
cb_flag_memory_check = CB_MEMCHK_ALL;
Expand Down
40 changes: 40 additions & 0 deletions cobc/codegen.c
Original file line number Diff line number Diff line change
Expand Up @@ -9260,6 +9260,40 @@ output_key_components (struct cb_file* f, struct cb_key_component* key_component
}
}


static void
output_indexed_file_key_colseq (const struct cb_file *f, const struct cb_alt_key *ak, int idx)
{
cb_tree key = ak ? ak->key : f->key;
cb_tree key_col = ak ? ak->collating_sequence_key : f->collating_sequence_key;
int type = cb_tree_type (key, cb_code_field (key));
cb_tree col = NULL;

/* We only apply a collating sequence if the key is alphanumeric / display */
if ((type & COB_TYPE_ALNUM) || (type == COB_TYPE_NUMERIC_DISPLAY)) {
col = key_col ? key_col : f->collating_sequence;
#if 0
/* TODO: this should be done for national, when available */
} else if (type & COB_TYPE_NATIONAL) {
col = key_col_n ? key_col_n : f->collating_sequence_n;
#endif
}

output_prefix ();
if (idx == 0) {
output ("%s%s->collating_sequence = ", CB_PREFIX_KEYS, f->cname);
} else {
output ("(%s%s + %d)->collating_sequence = ", CB_PREFIX_KEYS, f->cname, idx);
}
if ((col != NULL) && CB_REFERENCE_P (col)) {
output_param (cb_ref(col), -1);
output (";");
} else {
output ("NULL;");
}
output_newline ();
}

static void
output_file_initialization (struct cb_file *f)
{
Expand Down Expand Up @@ -9320,6 +9354,9 @@ output_file_initialization (struct cb_file *f)
} else {
output_line ("%s%s->offset = 0;", CB_PREFIX_KEYS, f->cname);
}
if (f->organization == COB_ORG_INDEXED) {
output_indexed_file_key_colseq (f, NULL, 0);
}
nkeys = 1;
for (l = f->alt_key_list; l; l = l->next) {
output_prefix ();
Expand All @@ -9342,6 +9379,9 @@ output_file_initialization (struct cb_file *f)
f->cname, nkeys);
output_key_components (f, l->component_list, nkeys);
}
if (f->organization == COB_ORG_INDEXED) {
output_indexed_file_key_colseq (f, l, nkeys);
}
nkeys++;
}
#if 0 /* now done in cob_file_malloc / cob_file_external_addr */
Expand Down
4 changes: 4 additions & 0 deletions cobc/flag.def
Original file line number Diff line number Diff line change
Expand Up @@ -103,6 +103,10 @@ CB_FLAG_NQ (1, "default-colseq", CB_FLAG_GETOPT_DEFAULT_COLSEQ,
_(" -fdefault-colseq=[ASCII|EBCDIC|NATIVE]\tdefine default collating sequence\n"
" * default: NATIVE"))

CB_FLAG_NQ (1, "default-file-colseq", CB_FLAG_GETOPT_DEFAULT_FILE_COLSEQ,
_(" -fdefault-file-colseq=[ASCII|EBCDIC|NATIVE]\tdefine default file collating sequence\n"
" * default: NATIVE"))

/* Binary flags */

/* Flags with suppressed help */
Expand Down
45 changes: 17 additions & 28 deletions cobc/parser.y
Original file line number Diff line number Diff line change
Expand Up @@ -336,29 +336,6 @@ check_non_area_a (cb_tree stmt) {

/* Collating sequences */

/* Known collating sequences/alphabets */
enum cb_colseq {
CB_COLSEQ_NATIVE,
CB_COLSEQ_ASCII,
CB_COLSEQ_EBCDIC,
};
enum cb_colseq cb_default_colseq = CB_COLSEQ_NATIVE;

/* Decipher character conversion table names */
int cb_deciph_default_colseq_name (const char * const name)
{
if (!cb_strcasecmp (name, "ASCII")) {
cb_default_colseq = CB_COLSEQ_ASCII;
} else if (!cb_strcasecmp (name, "EBCDIC")) {
cb_default_colseq = CB_COLSEQ_EBCDIC;
} else if (!cb_strcasecmp (name, "NATIVE")) {
cb_default_colseq = CB_COLSEQ_NATIVE;
} else {
return 1;
}
return 0;
}

static cb_tree
build_colseq_tree (const char *alphabet_name,
int alphabet_type,
Expand Down Expand Up @@ -901,23 +878,34 @@ check_relaxed_syntax (const cob_flags_t lev)
}

static void
setup_default_collation (struct cb_program *program) {
switch (cb_default_colseq) {
prepare_default_collation (enum cb_colseq colseq) {
switch (colseq) {
#ifdef COB_EBCDIC_MACHINE
case CB_COLSEQ_ASCII:
#else
case CB_COLSEQ_EBCDIC:
#endif
alphanumeric_collation = build_colseq (cb_default_colseq);
alphanumeric_collation = build_colseq (colseq);
break;
default:
alphanumeric_collation = NULL;
}
national_collation = NULL; /* TODO: default national collation */
}

static void
setup_default_collation (struct cb_program *program) {
prepare_default_collation (cb_default_colseq);
program->collating_sequence = alphanumeric_collation;
program->collating_sequence_n = national_collation;
}

static void
setup_default_file_collation (struct cb_file *file) {
prepare_default_collation (cb_default_file_colseq);
file->collating_sequence = alphanumeric_collation;
}

static void
program_init_without_program_id (void)
{
Expand Down Expand Up @@ -5365,6 +5353,7 @@ file_control_entry:

}
key_type = NO_KEY;
setup_default_file_collation (current_file);
}
_select_clauses_or_error
{
Expand Down Expand Up @@ -5752,7 +5741,7 @@ collating_sequence_clause:
check_repeated ("COLLATING", SYN_CLAUSE_3, &check_duplicate);
current_file->collating_sequence = alphanumeric_collation;
current_file->collating_sequence_n = national_collation;
CB_PENDING ("FILE COLLATING SEQUENCE");
CB_UNFINISHED ("FILE COLLATING SEQUENCE");
}
;

Expand Down Expand Up @@ -5804,7 +5793,7 @@ collating_sequence_clause_key:
and also attached to the correct key later, so just store in a list here: */
current_file->collating_sequence_keys =
cb_list_add(current_file->collating_sequence_keys, CB_BUILD_PAIR ($6, $4));
CB_PENDING ("KEY COLLATING SEQUENCE");
CB_UNFINISHED ("KEY COLLATING SEQUENCE");
}
;

Expand Down
53 changes: 50 additions & 3 deletions cobc/tree.c
Original file line number Diff line number Diff line change
Expand Up @@ -4661,9 +4661,12 @@ validate_file (struct cb_file *f, cb_tree name)

static void
validate_indexed_key_field (struct cb_file *f, struct cb_field *records,
cb_tree key, struct cb_key_component *component_list)
cb_tree key, struct cb_key_component *component_list,
struct cb_alt_key *cbak)
{
cb_tree key_ref;
cb_tree l;

struct cb_field *k;
struct cb_field *p;
struct cb_field *v;
Expand Down Expand Up @@ -4730,6 +4733,18 @@ validate_indexed_key_field (struct cb_file *f, struct cb_field *records,
" needs to be at least %d"), f->record_min, k->name, field_end);
}
}

/* get key collating sequence, if any */
for (l = f->collating_sequence_keys; l; l = CB_CHAIN (l)) {
cb_tree alpha_key = CB_VALUE (l);
if (key_ref == cb_ref (CB_PAIR_Y (alpha_key))) {
if (cbak == NULL) {
f->collating_sequence_key = CB_PAIR_X (alpha_key);
} else {
cbak->collating_sequence_key = CB_PAIR_X (alpha_key);
}
}
}
}

void
Expand Down Expand Up @@ -4771,7 +4786,7 @@ finalize_file (struct cb_file *f, struct cb_field *records)
struct cb_alt_key *cbak;
if (f->key) {
validate_indexed_key_field (f, records,
f->key, f->component_list);
f->key, f->component_list, NULL);
}
for (cbak = f->alt_key_list; cbak; cbak = cbak->next) {
if (f->flag_global) {
Expand All @@ -4781,7 +4796,7 @@ finalize_file (struct cb_file *f, struct cb_field *records)
}
}
validate_indexed_key_field (f, records,
cbak->key, cbak->component_list);
cbak->key, cbak->component_list, cbak);
}
}

Expand Down Expand Up @@ -7414,6 +7429,38 @@ cb_build_ml_suppress_checks (struct cb_ml_generate_tree *tree)
}


enum cb_colseq cb_default_colseq = CB_COLSEQ_NATIVE;
enum cb_colseq cb_default_file_colseq = CB_COLSEQ_NATIVE;

/* Decipher character conversion table names */
static int
cb_deciph_colseq_name (const char * const name, enum cb_colseq *colseq)
{
if (!cb_strcasecmp (name, "ASCII")) {
*colseq = CB_COLSEQ_ASCII;
} else if (!cb_strcasecmp (name, "EBCDIC")) {
*colseq = CB_COLSEQ_EBCDIC;
} else if (!cb_strcasecmp (name, "NATIVE")) {
*colseq = CB_COLSEQ_NATIVE;
} else {
return 1;
}
return 0;
}

int
cb_deciph_default_colseq_name (const char * const name)
{
return cb_deciph_colseq_name (name, &cb_default_colseq);
}

int
cb_deciph_default_file_colseq_name (const char * const name)
{
return cb_deciph_colseq_name (name, &cb_default_file_colseq);
}


#ifndef HAVE_DESIGNATED_INITS
void
cobc_init_tree (void)
Expand Down
13 changes: 13 additions & 0 deletions cobc/tree.h
Original file line number Diff line number Diff line change
Expand Up @@ -2343,6 +2343,7 @@ extern cb_tree cb_debug_sub_3;
extern cb_tree cb_debug_contents;

extern int cb_deciph_default_colseq_name (const char *const);
extern int cb_deciph_default_file_colseq_name (const char *const);

extern struct cb_program *cb_build_program (struct cb_program *,
const int);
Expand Down Expand Up @@ -2740,5 +2741,17 @@ extern int cobc_has_areacheck_directive (const char *directive);
#define CB_CHAIN_PAIR(x,y,z) x = cb_pair_add (x, y, z)
#define CB_FIELD_ADD(x,y) x = cb_field_add (x, y)

enum cb_colseq {
CB_COLSEQ_NATIVE,
CB_COLSEQ_ASCII,
CB_COLSEQ_EBCDIC,
};

extern enum cb_colseq cb_default_colseq;
extern enum cb_colseq cb_default_file_colseq;

extern int cb_deciph_default_colseq_name (const char * const name);
extern int cb_deciph_default_file_colseq_name (const char * const name);


#endif /* CB_TREE_H */
8 changes: 8 additions & 0 deletions libcob/ChangeLog
Original file line number Diff line number Diff line change
@@ -1,4 +1,12 @@

2024-01-25 David Declerck <[email protected]>

FR #459: support COLLATING SEQUENCE clause on SELECT / INDEXED files
* fileio.c (bdb_setkeycol, bdb_bt_compare, indexed_open, ...):
take the file collating sequence into account when comparing keys
* common.c, coblocal.h: rename common_cmps to cob_cmps
and make it available locally

2023-12-14 David Declerck <[email protected]>

* common.c (cob_terminate_routines, cob_call_with_exception_check):
Expand Down
Loading

0 comments on commit fab88f5

Please sign in to comment.