added sanity checking in the linearization builder

This commit is contained in:
krangelov
2021-11-18 10:33:20 +01:00
parent ec76223b41
commit 71020baa5e
2 changed files with 351 additions and 102 deletions

View File

@@ -1155,170 +1155,424 @@ class PGF_INTERNAL PgfLinBuilder : public PgfLinBuilderIface
size_t seq_index; size_t seq_index;
size_t sym_index; size_t sym_index;
const char *builder_error_msg =
"Detected incorrect use of the linearization builder";
public: public:
PgfLinBuilder(ref<PgfConcrLin> lin) { PgfLinBuilder(ref<PgfAbsFun> absfun, PgfConcr *concr, size_t n_prods)
this->lin = lin; {
ref<PgfConcrLincat> lincat =
namespace_lookup(concr->lincats, &absfun->type->name);
if (lincat == 0) {
throw pgf_error("Missing linearization category");
}
lin = PgfDB::malloc<PgfConcrLin>(absfun->name.size+1);
memcpy(&lin->name, &absfun->name, sizeof(PgfText)+absfun->name.size+1);
lin->ref_count = 1;
lin->absfun = absfun;
lin->args = vector_new<PgfPArg>(n_prods*absfun->type->hypos->len);
lin->res = vector_new<ref<PgfLParam>>(n_prods);
lin->seqs = vector_new<ref<Vector<PgfSymbol>>>(n_prods*lincat->fields->len);
this->arg_index = 0; this->arg_index = 0;
this->res_index = 0; this->res_index = 0;
this->seq_index = 0; this->seq_index = 0;
this->sym_index = 0; this->sym_index = (size_t) -1;
} }
void start_production(PgfExn *err) void start_production(PgfExn *err)
{ {
if (err->type != PGF_EXN_NONE)
return;
PGF_API_BEGIN {
if (res_index >= lin->res->len)
throw pgf_error(builder_error_msg);
*vector_elem(lin->res, res_index) = 0;
} PGF_API_END
} }
void add_argument(size_t i0, size_t n_terms, size_t *terms, PgfExn *err) void add_argument(size_t i0, size_t n_terms, size_t *terms, PgfExn *err)
{ {
ref<PgfLParam> param = PgfDB::malloc<PgfLParam>(n_terms*2*sizeof(size_t)); if (err->type != PGF_EXN_NONE)
param->i0 = i0; return;
param->n_terms = n_terms;
for (size_t i = 0; i < n_terms; i++) { PGF_API_BEGIN {
param->terms[i].factor = terms[2*i]; if (arg_index >= lin->args->len)
param->terms[i].var = terms[2*i+1]; throw pgf_error(builder_error_msg);
}
ref<PgfPArg> parg = vector_elem(lin->args, arg_index); ref<PgfLParam> param = PgfDB::malloc<PgfLParam>(n_terms*2*sizeof(size_t));
parg->param = param; param->i0 = i0;
param->n_terms = n_terms;
arg_index++; for (size_t i = 0; i < n_terms; i++) {
param->terms[i].factor = terms[2*i];
param->terms[i].var = terms[2*i+1];
}
ref<PgfPArg> parg = vector_elem(lin->args, arg_index);
parg->param = param;
arg_index++;
} PGF_API_END
} }
void set_result(size_t i0, size_t n_terms, size_t *terms, PgfExn *err) void set_result(size_t i0, size_t n_terms, size_t *terms, PgfExn *err)
{ {
ref<PgfLParam> param = PgfDB::malloc<PgfLParam>(n_terms*2*sizeof(size_t)); if (err->type != PGF_EXN_NONE)
param->i0 = i0; return;
param->n_terms = n_terms;
for (size_t i = 0; i < n_terms; i++) { PGF_API_BEGIN {
param->terms[i].factor = terms[2*i]; if (res_index >= lin->res->len)
param->terms[i].var = terms[2*i+1]; throw pgf_error(builder_error_msg);
}
*vector_elem(lin->res, res_index) = param; ref<PgfLParam> param = PgfDB::malloc<PgfLParam>(n_terms*2*sizeof(size_t));
param->i0 = i0;
param->n_terms = n_terms;
for (size_t i = 0; i < n_terms; i++) {
param->terms[i].factor = terms[2*i];
param->terms[i].var = terms[2*i+1];
}
*vector_elem(lin->res, res_index) = param;
} PGF_API_END
} }
void start_sequence(size_t n_syms, PgfExn *err) void start_sequence(size_t n_syms, PgfExn *err)
{ {
*vector_elem(lin->seqs, seq_index) = vector_new<PgfSymbol>(n_syms); if (err->type != PGF_EXN_NONE)
sym_index = 0; return;
PGF_API_BEGIN {
if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
*vector_elem(lin->seqs, seq_index) = vector_new<PgfSymbol>(n_syms);
sym_index = 0;
} PGF_API_END
} }
void add_symcat(size_t d, size_t i0, size_t n_terms, size_t *terms, PgfExn *err) void add_symcat(size_t d, size_t i0, size_t n_terms, size_t *terms, PgfExn *err)
{ {
ref<PgfSymbolCat> symcat = PgfDB::malloc<PgfSymbolCat>(n_terms*2*sizeof(size_t)); if (err->type != PGF_EXN_NONE)
symcat->d = d; return;
symcat->r.i0 = i0;
symcat->r.n_terms = n_terms;
for (size_t i = 0; i < n_terms; i++) { PGF_API_BEGIN {
symcat->r.terms[i].factor = terms[2*i]; if (sym_index == (size_t) -1)
symcat->r.terms[i].var = terms[2*i+1]; throw pgf_error(builder_error_msg);
}
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (seq_index >= lin->seqs->len)
*vector_elem(syms, sym_index) = ref<PgfSymbolCat>::tagged(symcat); throw pgf_error(builder_error_msg);
sym_index++; ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
ref<PgfSymbolCat> symcat = PgfDB::malloc<PgfSymbolCat>(n_terms*2*sizeof(size_t));
symcat->d = d;
symcat->r.i0 = i0;
symcat->r.n_terms = n_terms;
for (size_t i = 0; i < n_terms; i++) {
symcat->r.terms[i].factor = terms[2*i];
symcat->r.terms[i].var = terms[2*i+1];
}
*vector_elem(syms, sym_index) = ref<PgfSymbolCat>::tagged(symcat);
sym_index++;
} PGF_API_END
} }
void add_symlit(size_t d, size_t i0, size_t n_terms, size_t *terms, PgfExn *err) void add_symlit(size_t d, size_t i0, size_t n_terms, size_t *terms, PgfExn *err)
{ {
ref<PgfSymbolLit> symlit = PgfDB::malloc<PgfSymbolLit>(n_terms*2*sizeof(size_t)); if (err->type != PGF_EXN_NONE)
symlit->d = d; return;
symlit->r.i0 = i0;
symlit->r.n_terms = n_terms;
for (size_t i = 0; i < n_terms; i++) { PGF_API_BEGIN {
symlit->r.terms[i].factor = terms[2*i]; if (sym_index == (size_t) -1)
symlit->r.terms[i].var = terms[2*i+1]; throw pgf_error(builder_error_msg);
}
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (seq_index >= lin->seqs->len)
*vector_elem(syms, sym_index) = ref<PgfSymbolLit>::tagged(symlit); throw pgf_error(builder_error_msg);
sym_index++; ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
ref<PgfSymbolLit> symlit = PgfDB::malloc<PgfSymbolLit>(n_terms*2*sizeof(size_t));
symlit->d = d;
symlit->r.i0 = i0;
symlit->r.n_terms = n_terms;
for (size_t i = 0; i < n_terms; i++) {
symlit->r.terms[i].factor = terms[2*i];
symlit->r.terms[i].var = terms[2*i+1];
}
*vector_elem(syms, sym_index) = ref<PgfSymbolLit>::tagged(symlit);
sym_index++;
} PGF_API_END
} }
void add_symvar(size_t d, size_t r, PgfExn *err) void add_symvar(size_t d, size_t r, PgfExn *err)
{ {
ref<PgfSymbolVar> symvar = PgfDB::malloc<PgfSymbolVar>(); if (err->type != PGF_EXN_NONE)
symvar->d = d; return;
symvar->r = r;
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); PGF_API_BEGIN {
*vector_elem(syms, sym_index) = ref<PgfSymbolVar>::tagged(symvar); if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
sym_index++; if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
ref<PgfSymbolVar> symvar = PgfDB::malloc<PgfSymbolVar>();
symvar->d = d;
symvar->r = r;
*vector_elem(syms, sym_index) = ref<PgfSymbolVar>::tagged(symvar);
sym_index++;
} PGF_API_END
} }
void add_symks(PgfText *token, PgfExn *err) void add_symks(PgfText *token, PgfExn *err)
{ {
ref<PgfSymbolKS> symtok = PgfDB::malloc<PgfSymbolKS>(token->size+1); if (err->type != PGF_EXN_NONE)
memcpy(&symtok->token, token, sizeof(PgfText)+token->size+1); return;
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); PGF_API_BEGIN {
*vector_elem(syms, sym_index) = ref<PgfSymbolKS>::tagged(symtok); if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
sym_index++; if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
ref<PgfSymbolKS> symtok = PgfDB::malloc<PgfSymbolKS>(token->size+1);
memcpy(&symtok->token, token, sizeof(PgfText)+token->size+1);
*vector_elem(syms, sym_index) = ref<PgfSymbolKS>::tagged(symtok);
sym_index++;
} PGF_API_END
} }
void add_symbind(PgfExn *err) void add_symbind(PgfExn *err)
{ {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (err->type != PGF_EXN_NONE)
*vector_elem(syms, sym_index) = ref<PgfSymbolBIND>::tagged(0); return;
sym_index++; PGF_API_BEGIN {
if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
*vector_elem(syms, sym_index) = ref<PgfSymbolBIND>::tagged(0);
sym_index++;
} PGF_API_END
} }
void add_symsoftbind(PgfExn *err) void add_symsoftbind(PgfExn *err)
{ {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (err->type != PGF_EXN_NONE)
*vector_elem(syms, sym_index) = ref<PgfSymbolSOFTBIND>::tagged(0); return;
sym_index++; PGF_API_BEGIN {
if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
*vector_elem(syms, sym_index) = ref<PgfSymbolSOFTBIND>::tagged(0);
sym_index++;
} PGF_API_END
} }
void add_symne(PgfExn *err) void add_symne(PgfExn *err)
{ {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (err->type != PGF_EXN_NONE)
*vector_elem(syms, sym_index) = ref<PgfSymbolNE>::tagged(0); return;
sym_index++; PGF_API_BEGIN {
if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
*vector_elem(syms, sym_index) = ref<PgfSymbolNE>::tagged(0);
sym_index++;
} PGF_API_END
} }
void add_symsoftspace(PgfExn *err) void add_symsoftspace(PgfExn *err)
{ {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (err->type != PGF_EXN_NONE)
*vector_elem(syms, sym_index) = ref<PgfSymbolSOFTSPACE>::tagged(0); return;
sym_index++; PGF_API_BEGIN {
if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
*vector_elem(syms, sym_index) = ref<PgfSymbolSOFTSPACE>::tagged(0);
sym_index++;
} PGF_API_END
} }
void add_symcapit(PgfExn *err) void add_symcapit(PgfExn *err)
{ {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (err->type != PGF_EXN_NONE)
*vector_elem(syms, sym_index) = ref<PgfSymbolCAPIT>::tagged(0); return;
sym_index++; PGF_API_BEGIN {
if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
*vector_elem(syms, sym_index) = ref<PgfSymbolCAPIT>::tagged(0);
sym_index++;
} PGF_API_END
} }
void add_symallcapit(PgfExn *err) void add_symallcapit(PgfExn *err)
{ {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index); if (err->type != PGF_EXN_NONE)
*vector_elem(syms, sym_index) = ref<PgfSymbolALLCAPIT>::tagged(0); return;
sym_index++; PGF_API_BEGIN {
if (sym_index == (size_t) -1)
throw pgf_error(builder_error_msg);
if (seq_index >= lin->seqs->len)
throw pgf_error(builder_error_msg);
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
if (sym_index >= syms->len)
throw pgf_error(builder_error_msg);
*vector_elem(syms, sym_index) = ref<PgfSymbolALLCAPIT>::tagged(0);
} PGF_API_END
} }
void end_sequence(PgfExn *err) { void end_sequence(PgfExn *err)
seq_index++; {
if (err->type != PGF_EXN_NONE)
return;
PGF_API_BEGIN {
if (sym_index != (*vector_elem(lin->seqs, seq_index))->len)
throw pgf_error(builder_error_msg);
sym_index = (size_t) -1;
seq_index++;
} PGF_API_END
} }
void end_production(PgfExn *err) void end_production(PgfExn *err)
{ {
this->res_index++; if (err->type != PGF_EXN_NONE)
return;
PGF_API_BEGIN {
size_t n_args = (lin->args->len/lin->res->len);
if (arg_index != (res_index+1)*n_args)
throw pgf_error(builder_error_msg);
if (*vector_elem(lin->res, res_index) == 0)
throw pgf_error(builder_error_msg);
size_t n_seqs = (lin->seqs->len/lin->res->len);
if (seq_index != (res_index+1)*n_seqs)
throw pgf_error(builder_error_msg);
res_index++;
} PGF_API_END
}
ref<PgfConcrLin> done()
{
if (res_index != lin->res->len)
throw pgf_error(builder_error_msg);
return lin;
}
void failed()
{
for (size_t i = 0; i < arg_index; i++) {
PgfDB::free(vector_elem(lin->args, i)->param);
}
PgfDB::free(lin->args);
for (size_t i = 0; i < res_index; i++) {
PgfDB::free(*vector_elem(lin->res, i));
}
PgfDB::free(lin->res);
for (size_t i = 0; i < seq_index; i++) {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, i);
for (size_t j = 0; j < syms->len; j++) {
PgfSymbol sym = *vector_elem(syms, j);
PgfDB::free(ref<void>::untagged(sym));
}
PgfDB::free(syms);
}
if (sym_index != (size_t) -1) {
ref<Vector<PgfSymbol>> syms = *vector_elem(lin->seqs, seq_index);
for (size_t j = 0; j < sym_index; j++) {
PgfSymbol sym = *vector_elem(syms, j);
PgfDB::free(ref<void>::untagged(sym));
}
PgfDB::free(syms);
}
PgfDB::free(lin->seqs);
PgfDB::free(lin);
lin = 0;
} }
}; };
@@ -1394,27 +1648,17 @@ void pgf_create_lin(PgfDB *db,
throw pgf_error("There is no corresponding function in the abstract syntax"); throw pgf_error("There is no corresponding function in the abstract syntax");
} }
ref<PgfConcrLincat> lincat = PgfLinBuilder builder(absfun, concr, n_prods);
namespace_lookup(concr->lincats, &absfun->type->name);
if (lincat == 0) {
throw pgf_error("Missing linearization category");
}
ref<PgfConcrLin> lin = PgfDB::malloc<PgfConcrLin>(name->size+1);
memcpy(&lin->name, name, sizeof(PgfText)+name->size+1);
lin->ref_count = 1;
lin->absfun = absfun;
lin->args = vector_new<PgfPArg>(n_prods*absfun->type->hypos->len);
lin->res = vector_new<ref<PgfLParam>>(n_prods);
lin->seqs = vector_new<ref<Vector<PgfSymbol>>>(n_prods*lincat->fields->len);
PgfLinBuilder builder(lin);
build->build(&builder, err); build->build(&builder, err);
if (err->type == PGF_EXN_NONE) {
Namespace<PgfConcrLin> lins = ref<PgfConcrLin> lin = builder.done();
namespace_insert(concr->lins, lin); Namespace<PgfConcrLin> lins =
namespace_release(concr->lins); namespace_insert(concr->lins, lin);
concr->lins = lins; namespace_release(concr->lins);
concr->lins = lins;
} else {
builder.failed();
}
} PGF_API_END } PGF_API_END
} }

View File

@@ -31,7 +31,6 @@ import PGF2.Expr
import Foreign import Foreign
import Foreign.C import Foreign.C
import Control.Monad
import Control.Exception import Control.Exception
#include <pgf/pgf.h> #include <pgf/pgf.h>
@@ -243,17 +242,24 @@ createLin name prods = Transaction $ \c_db c_abstr c_revision c_exn ->
(#poke PgfBuildLinIfaceVtbl, build) vtbl c_callback (#poke PgfBuildLinIfaceVtbl, build) vtbl c_callback
pgf_create_lin c_db c_abstr c_revision c_name (fromIntegral (length prods)) c_build c_exn pgf_create_lin c_db c_abstr c_revision c_name (fromIntegral (length prods)) c_build c_exn
where where
forM_ [] c_exn f = return ()
forM_ (x:xs) c_exn f = do
ex_type <- (#peek PgfExn, type) c_exn
if (ex_type :: (#type PgfExnType)) == (#const PGF_EXN_NONE)
then f x >> forM_ xs c_exn f
else return ()
build _ c_builder c_exn = do build _ c_builder c_exn = do
vtbl <- (#peek PgfLinBuilderIface, vtbl) c_builder vtbl <- (#peek PgfLinBuilderIface, vtbl) c_builder
forM_ prods $ \(Production args res seqs) -> do forM_ prods c_exn $ \(Production args res seqs) -> do
fun <- (#peek PgfLinBuilderIfaceVtbl, start_production) vtbl fun <- (#peek PgfLinBuilderIfaceVtbl, start_production) vtbl
callLinBuilder0 fun c_builder c_exn callLinBuilder0 fun c_builder c_exn
fun <- (#peek PgfLinBuilderIfaceVtbl, add_argument) vtbl fun <- (#peek PgfLinBuilderIfaceVtbl, add_argument) vtbl
forM_ args $ \(PArg _ param) -> forM_ args c_exn $ \(PArg _ param) ->
callLParam (callLinBuilder3 fun c_builder) param c_exn callLParam (callLinBuilder3 fun c_builder) param c_exn
fun <- (#peek PgfLinBuilderIfaceVtbl, set_result) vtbl fun <- (#peek PgfLinBuilderIfaceVtbl, set_result) vtbl
callLParam (callLinBuilder3 fun c_builder) res c_exn callLParam (callLinBuilder3 fun c_builder) res c_exn
forM_ seqs $ \syms -> do forM_ seqs c_exn $ \syms -> do
fun <- (#peek PgfLinBuilderIfaceVtbl, start_sequence) vtbl fun <- (#peek PgfLinBuilderIfaceVtbl, start_sequence) vtbl
callLinBuilder1 fun c_builder (fromIntegral (length syms)) c_exn callLinBuilder1 fun c_builder (fromIntegral (length syms)) c_exn
mapM_ (addSymbol c_builder vtbl c_exn) syms mapM_ (addSymbol c_builder vtbl c_exn) syms
@@ -261,7 +267,6 @@ createLin name prods = Transaction $ \c_db c_abstr c_revision c_exn ->
callLinBuilder0 fun c_builder c_exn callLinBuilder0 fun c_builder c_exn
fun <- (#peek PgfLinBuilderIfaceVtbl, end_production) vtbl fun <- (#peek PgfLinBuilderIfaceVtbl, end_production) vtbl
callLinBuilder0 fun c_builder c_exn callLinBuilder0 fun c_builder c_exn
return ()
addSymbol c_builder vtbl c_exn (SymCat d r) = do addSymbol c_builder vtbl c_exn (SymCat d r) = do
fun <- (#peek PgfLinBuilderIfaceVtbl, add_symcat) vtbl fun <- (#peek PgfLinBuilderIfaceVtbl, add_symcat) vtbl