aboutsummaryrefslogtreecommitdiffhomepage
path: root/src/qreg-commands.c
diff options
context:
space:
mode:
authorRobin Haberkorn <robin.haberkorn@googlemail.com>2024-09-04 12:49:29 +0200
committerRobin Haberkorn <robin.haberkorn@googlemail.com>2024-09-09 18:22:21 +0200
commitb31b88717172e22b49c0493185f603b8f84989ec (patch)
tree43850d7d04e721987b89c37c68f24e657b5cb9c6 /src/qreg-commands.c
parentb85edaa0021c06d63fee6d8904fc822815e8b933 (diff)
downloadsciteco-b31b88717172e22b49c0493185f603b8f84989ec.tar.gz
the ^EUq string building escape now respects the encoding (can insert bytes or codepoints) (refs #5)
* This is trickier than it sounds because there isn't one single place to consult. It depends on the context. If the string argument relates to buffer contents - as in <I>, <S>, <FR> etc. - the buffer's encoding is consulted. If it goes into a register (EU), the register's encoding is consulted. Everything else (O, EN, EC, ES...) expects only Unicode codepoints. * This is communicated through a new field teco_machine_stringbuilding_t::codepage which must be set in the states' initial callback. * Seems overkill just for ^EUq, but it can be used for context-sensitive processing of all the other string building constructs as well. * ^V and ^W cannot be supported for Unicode characters for the time being without an Unicode-aware parser
Diffstat (limited to 'src/qreg-commands.c')
-rw-r--r--src/qreg-commands.c18
1 files changed, 18 insertions, 0 deletions
diff --git a/src/qreg-commands.c b/src/qreg-commands.c
index 09b2b90..1bde944 100644
--- a/src/qreg-commands.c
+++ b/src/qreg-commands.c
@@ -470,6 +470,23 @@ TECO_DEFINE_STATE_EXPECTQREG(teco_state_eucommand,
.expectqreg.type = TECO_QREG_OPTIONAL_INIT
);
+static gboolean
+teco_state_setqregstring_building_initial(teco_machine_main_t *ctx, GError **error)
+{
+ if (ctx->mode > TECO_MODE_NORMAL)
+ return TRUE;
+
+ teco_qreg_t *qreg;
+ teco_machine_qregspec_get_results(ctx->expectqreg, &qreg, NULL);
+
+ /*
+ * The expected codepage of string building constructs is determined
+ * by the Q-Register.
+ */
+ teco_undo_guint(ctx->expectstring.machine.codepage) = qreg->vtable->get_codepage(qreg);
+ return TRUE;
+}
+
static teco_state_t *
teco_state_setqregstring_building_done(teco_machine_main_t *ctx, const teco_string_t *str, GError **error)
{
@@ -487,6 +504,7 @@ teco_state_setqregstring_building_done(teco_machine_main_t *ctx, const teco_stri
* characters \fBenabled\fP.
*/
TECO_DEFINE_STATE_EXPECTSTRING(teco_state_setqregstring_building,
+ .initial_cb = (teco_state_initial_cb_t)teco_state_setqregstring_building_initial,
.expectstring.string_building = TRUE
);