Context Navigation

← Previous Changeset
Next Changeset →

Changeset a0fc4be in mainline

Timestamp:

2011-08-20T06:51:43Z (13 years ago)

Author:

Jakub Jermar <jakub@…>

Branches:

lfn, master, serial, ticket/834-toolchain-update, topic/msim-upgrade, topic/simplify-dev-export

Children:

0f4532e, 5fb32c5, abf04a54

Parents:

e3e4a2c (diff), b2727f18 (diff)
Note: this is a merge changeset, the changes displayed below correspond to the merge itself.
Use the (diff) links above to see all the changes relative to each parent.

Message:

Merge Martin Sucha's improvements to bdsh completion:

improved tokenizer
use tokenizer also in completion
display completion options in columns

Location:

Files:

5 edited

app/bdsh/compl.c (modified) (10 diffs)
app/bdsh/input.c (modified) (8 diffs)
app/bdsh/tok.c (modified) (14 diffs)
app/bdsh/tok.h (modified) (2 diffs)
lib/clui/tinput.c (modified) (2 diffs)

Legend:

(no marker): Unmodified
+: Added
-: Removed

uspace/app/bdsh/compl.c

-              re3e4a2c
+              ra0fc4be
 /*
  * Copyright (c) 2011 Jiri Svoboda
+ * Copyright (c) 2011 Martin Sucha
  * All rights reserved.
+ *
 …
 #include "compl.h"
 #include "exec.h"
+#include "tok.h"
 static int compl_init(wchar_t *text, size_t pos, size_t *cstart, void **state);
 …
+{
         compl_t *cs = NULL;
-        size_t p;
         size_t pref_size;
         char *stext = NULL;
 …
         static const char *dirlist_arg[] = { ".", NULL };
         int retval;
+        tokenizer_t tok;
+        token_t tokens[WORD_MAX];
+        unsigned int current_token;
+        size_t tokens_length;
         cs = calloc(1, sizeof(compl_t));
 …
+        }
-        /*
-         * Copy token pointed to by caret from start up to the caret.
-         * XXX Ideally we would use the standard tokenizer.
-         */
-        p = pos;
-        while (p > 0 && text[p - 1] != (wchar_t) ' ')
-                --p;
-        *cstart = p;
         /* Convert text buffer to string */
         stext = wstr_to_astr(text + *cstart);
+        stext = wstr_to_astr(text);
         if (stext == NULL) {
                 retval = ENOMEM;
                 goto error;
+        }
+        /* Extract the prefix being completed */
+        /* Tokenize the input string */
+        retval = tok_init(&tok, stext, tokens, WORD_MAX);
+        if (retval != EOK) {
+                goto error;
+        }
+        retval = tok_tokenize(&tok, &tokens_length);
+        if (retval != EOK) {
+                goto error;
+        }
+        /* Find the current token */
+        for (current_token = 0; current_token < tokens_length; current_token++) {
+                token_t *t = &tokens[current_token];
+                size_t end = t->char_start + t->char_length;
+                /* Check if the caret lies inside the token or immediately
+                 * after it
+                 */
+                if (t->char_start <= pos && pos <= end) {
+                        break;
+                }
+        }
+        if (tokens[current_token].type != TOKTYPE_SPACE) {
+                *cstart = tokens[current_token].char_start;
+        }
+        else {
+                *cstart = pos;
+        }
+        /* Extract the prefix being completed
+         * XXX: handle strings, etc.
+         */
         pref_size = str_lsize(stext, pos - *cstart);
         prefix = malloc(pref_size + 1);
 …
+        }
+        str_ncpy(prefix, pref_size + 1, stext, pref_size);
+        str_ncpy(prefix, pref_size + 1, stext +
+            tokens[current_token].byte_start, pref_size);
         /*
 …
          * We look at the previous token. If there is none or it is a pipe
          * ('|'), it is a command, otherwise it is an argument.
-         * XXX Again we should use the standard tokenizer/parser.
          */
         /* Skip any whitespace before current token */
+        while (p > 0 && text[p - 1] == (wchar_t) ' ')
+                --p;
+        int prev_token = current_token - 1;
+        if (prev_token != -1 && tokens[prev_token].type == TOKTYPE_SPACE) {
+                prev_token--;
+        }
         /*
 …
          * follows a pipe token.
          */
         if (p == 0 || text[p - 1] == '|')
+        if (prev_token == -1 || tokens[prev_token].type == TOKTYPE_SPACE)
                 cs->is_command = true;
         else
 …
         cs->prefix_len = str_length(cs->prefix);
+        tok_fini(&tok);
         *state = cs;
 …
 error:
         /* Error cleanup */
+        tok_fini(&tok);
         if (cs != NULL && cs->path_list != NULL) {

uspace/app/bdsh/input.c

-              re3e4a2c
+              ra0fc4be
  * Copyright (c) 2008 Tim Post
  * Copyright (c) 2011 Jiri Svoboda
+ * Copyright (c) 2011 Martin Sucha
  * All rights reserved.
+ *
 …
+{
         char *cmd[WORD_MAX];
+        token_t tokens_space[WORD_MAX];
+        token_t *tokens = tokens_space;
         int rc = 0;
         tokenizer_t tok;
+        int i, pipe_count, processed_pipes;
+        int pipe_pos[2];
+        char **actual_cmd;
+        unsigned int i, pipe_count, processed_pipes;
+        unsigned int pipe_pos[2];
         char *redir_from = NULL;
         char *redir_to = NULL;
 …
                 return CL_EFAIL;
         rc = tok_init(&tok, usr->line, cmd, WORD_MAX);
+        rc = tok_init(&tok, usr->line, tokens, WORD_MAX);
         if (rc != EOK) {
                 goto finit;
+        }
+        rc = tok_tokenize(&tok);
+        size_t tokens_length;
+        rc = tok_tokenize(&tok, &tokens_length);
         if (rc != EOK) {
                 goto finit;
+        }
+        if (tokens_length > 0 && tokens[0].type == TOKTYPE_SPACE) {
+                tokens++;
+                tokens_length--;
+        }
+        if (tokens_length > 0 && tokens[tokens_length-1].type == TOKTYPE_SPACE) {
+                tokens_length--;
+        }
 …
          * First find the pipes and check that there are no more
          */
+        int cmd_length = 0;
+        for (i = 0, pipe_count = 0; cmd[i] != NULL; i++, cmd_length++) {
+                if (cmd[i][0] == '|') {
+        for (i = 0, pipe_count = 0; i < tokens_length; i++) {
+                if (tokens[i].type == TOKTYPE_PIPE) {
                         if (pipe_count >= 2) {
                                 print_pipe_usage();
 …
+        }
+        actual_cmd = cmd;
+        unsigned int cmd_token_start = 0;
+        unsigned int cmd_token_end = tokens_length;
         processed_pipes = 0;
         /* Check if the first part (from <file> |) is present */
         if (pipe_count > 0 && pipe_pos[0] == 2 && str_cmp(cmd[0], "from") == 0) {
+        if (pipe_count > 0 && (pipe_pos[0] == 3 || pipe_pos[0] == 4) && str_cmp(tokens[0].text, "from") == 0) {
                 /* Ignore the first three tokens (from, file, pipe) and set from */
                 redir_from = cmd[1];
                 actual_cmd = cmd + 3;
+                redir_from = tokens[2].text;
+                cmd_token_start = pipe_pos[0]+1;
                 processed_pipes++;
+        }
 …
         /* Check if the second part (| to <file>) is present */
         if ((pipe_count - processed_pipes) > 0 &&
+            pipe_pos[processed_pipes] == cmd_length - 3 &&
+            str_cmp(cmd[cmd_length-2], "to") == 0) {
+            (pipe_pos[processed_pipes] == tokens_length - 4 ||
+            (pipe_pos[processed_pipes] == tokens_length - 5 &&
+            tokens[tokens_length-4].type == TOKTYPE_SPACE )) &&
+            str_cmp(tokens[tokens_length-3].text, "to") == 0) {
                 /* Ignore the last three tokens (pipe, to, file) and set to */
+                redir_to = cmd[cmd_length-1];
+                cmd[cmd_length-3] = NULL;
+                cmd_length -= 3;
+                redir_to = tokens[tokens_length-1].text;
+                cmd_token_end = pipe_pos[processed_pipes];
                 processed_pipes++;
+        }
 …
+        }
+        if (actual_cmd[0] == NULL) {
+        /* Convert tokens of the command to string array */
+        unsigned int cmd_pos = 0;
+        for (i = cmd_token_start; i < cmd_token_end; i++) {
+                if (tokens[i].type != TOKTYPE_SPACE) {
+                        cmd[cmd_pos++] = tokens[i].text;
+                }
+        }
+        cmd[cmd_pos++] = NULL;
+        if (cmd[0] == NULL) {
                 print_pipe_usage();
                 rc = ENOTSUP;
 …
+        }
         rc = run_command(actual_cmd, usr, &new_iostate);
+        rc = run_command(cmd, usr, &new_iostate);
 finit_with_files:

uspace/app/bdsh/tok.c

-              re3e4a2c
+              ra0fc4be
 static bool tok_pending_chars(tokenizer_t *);
 static int tok_finish_string(tokenizer_t *);
+static void tok_start_token(tokenizer_t *, token_type_t);
 /** Initialize the token parser
 …
  * @param max_tokens number of elements of the out_tokens array
  */
 int tok_init(tokenizer_t *tok, char *input, char **out_tokens,
+int tok_init(tokenizer_t *tok, char *input, token_t *out_tokens,
     size_t max_tokens)
+{
         tok->in = input;
         tok->in_offset = 0;
+        tok->last_in_offset = 0;
+        tok->in_char_offset = 0;
+        tok->last_in_char_offset = 0;
         tok->outtok = out_tokens;
         tok->outtok_offset = 0;
+        /* Leave one slot for a null terminator */
+        assert(max_tokens > 0);
+        tok->outtok_size = max_tokens - 1;
+        tok->outtok_size = max_tokens;
         /* Prepare a buffer where all the token strings will be stored */
 …
 /** Tokenize the input string into the tokens */
 int tok_tokenize(tokenizer_t *tok)
+int tok_tokenize(tokenizer_t *tok, size_t *tokens_length)
+{
         int rc;
         wchar_t cur_char;
+        wchar_t next_char;
         /* Read the input line char by char and append tokens */
+        while ((cur_char = tok_get_char(tok)) != 0) {
+                if (cur_char == ' ') {
+                        /* Spaces delimit tokens, but are not processed in any way
+                         * Push the token if there is any.
+        while ((next_char = tok_look_char(tok)) != 0) {
+                if (next_char == ' ') {
+                        /* Push the token if there is any.
                          * There may not be any pending char for a token in case
                          * there are several spaces in the input.
 …
+                                }
+                        }
+                }
+                else if (cur_char == '|') {
+                        /* Pipes are tokens that are delimiters and should be output
+                         * as a separate token
+                        tok_start_token(tok, TOKTYPE_SPACE);
+                        /* Eat all the spaces */
+                        while (tok_look_char(tok) == ' ') {
+                                tok_push_char(tok, tok_get_char(tok));
+                        }
+                        tok_push_token(tok);
+                }
+                else if (next_char == '|') {
+                        /* Pipes are tokens that are delimiters and should be
+                         * output as a separate token
                          */
                         if (tok_pending_chars(tok)) {
 …
+                        }
+                        rc = tok_push_char(tok, '|');
+                        tok_start_token(tok, TOKTYPE_PIPE);
+                        rc = tok_push_char(tok, tok_get_char(tok));
                         if (rc != EOK) {
                                 return rc;
 …
+                        }
+                }
                 else if (cur_char == '\'') {
+                else if (next_char == '\'') {
                         /* A string starts with a quote (') and ends again with a quote.
                          * A literal quote is written as ''
                          */
+                        tok_start_token(tok, TOKTYPE_TEXT);
+                        /* Eat the quote */
+                        tok_get_char(tok);
                         rc = tok_finish_string(tok);
                         if (rc != EOK) {
 …
+                }
                 else {
+                        if (!tok_pending_chars(tok)) {
+                                tok_start_token(tok, TOKTYPE_TEXT);
+                        }
                         /* If we are handling any other character, just append it to
                          * the current token.
                          */
                         rc = tok_push_char(tok, cur_char);
+                        rc = tok_push_char(tok, tok_get_char(tok));
                         if (rc != EOK) {
                                 return rc;
 …
+        }
+        /* We always have a space for the terminator, as we
+         * reserved it in tok_init */
+        tok->outtok[tok->outtok_offset] = 0;
+        *tokens_length = tok->outtok_offset;
         return EOK;
 …
+{
         int rc;
+        wchar_t cur_char;
+        while ((cur_char = tok_get_char(tok)) != 0) {
+                if (cur_char == '\'') {
+        wchar_t next_char;
+        while ((next_char = tok_look_char(tok)) != 0) {
+                if (next_char == '\'') {
+                        /* Eat the quote */
+                        tok_get_char(tok);
                         if (tok_look_char(tok) == '\'') {
                                 /* Encode a single literal quote */
 …
+                }
                 else {
                         rc = tok_push_char(tok, cur_char);
+                        rc = tok_push_char(tok, tok_get_char(tok));
                         if (rc != EOK) {
                                 return rc;
 …
 wchar_t tok_get_char(tokenizer_t *tok)
+{
+        tok->in_char_offset++;
         return str_decode(tok->in, &tok->in_offset, STR_NO_LIMIT);
+}
 …
 wchar_t tok_look_char(tokenizer_t *tok)
+{
+        size_t old_offset = tok->in_offset;
+        unsigned int old_offset = tok->in_offset;
+        unsigned int old_char_offset = tok->in_char_offset;
         wchar_t ret = tok_get_char(tok);
         tok->in_offset = old_offset;
+        tok->in_char_offset = old_char_offset;
         return ret;
+}
 …
+}
+void tok_start_token(tokenizer_t *tok, token_type_t type)
+{
+        tok->current_type = type;
+}
 /** Push the current token to the output array */
 int tok_push_token(tokenizer_t *tok)
 …
         tok->outbuf[tok->outbuf_offset++] = 0;
+        tok->outtok[tok->outtok_offset++] = tok->outbuf + tok->outbuf_last_start;
+        token_t *tokinfo = &tok->outtok[tok->outtok_offset++];
+        tokinfo->type = tok->current_type;
+        tokinfo->text = tok->outbuf + tok->outbuf_last_start;
+        tokinfo->byte_start = tok->last_in_offset;
+        tokinfo->byte_length = tok->in_offset - tok->last_in_offset;
+        tokinfo->char_start = tok->last_in_char_offset;
+        tokinfo->char_length = tok->in_char_offset - tok->last_in_char_offset;
         tok->outbuf_last_start = tok->outbuf_offset;
+        /* We have consumed the first char of the next token already */
+        tok->last_in_offset = tok->in_offset;
+        tok->last_in_char_offset = tok->in_char_offset;
         return EOK;

uspace/app/bdsh/tok.h

-              re3e4a2c
+              ra0fc4be
 #define TOK_H
+typedef enum {
+        TOKTYPE_TEXT,
+        TOKTYPE_PIPE,
+        TOKTYPE_SPACE
+} token_type_t;
+typedef struct {
+        char *text;
+        unsigned int byte_start;
+        unsigned int char_start;
+        size_t byte_length;
+        size_t char_length;
+        token_type_t type;
+} token_t;
 typedef struct {
         char *in;
+        size_t in_offset;
+        unsigned int in_offset;
+        unsigned int last_in_offset;
+        unsigned int in_char_offset;
+        unsigned int last_in_char_offset;
         char *outbuf;
 …
         size_t outbuf_last_start;
+        char **outtok;
+        token_t *outtok;
+        token_type_t current_type;
         size_t outtok_offset;
         size_t outtok_size;
 } tokenizer_t;
 extern int tok_init(tokenizer_t *, char *, char **, size_t);
+extern int tok_init(tokenizer_t *, char *, token_t *, size_t);
 extern void tok_fini(tokenizer_t *);
 extern int tok_tokenize(tokenizer_t *);
+extern int tok_tokenize(tokenizer_t *, size_t *);
 #endif

uspace/lib/clui/tinput.c

-              re3e4a2c
+              ra0fc4be
+}
+/* Print a list of completions */
+static void tinput_show_completions(tinput_t *ti, char **compl, size_t cnum)
+{
+        unsigned int i;
+        /* Determine the maximum length of the completion in chars */
+        size_t max_length = 0;
+        for (i = 0; i < cnum; i++)
+                max_length = max(max_length, str_length(compl[i]));
+        unsigned int cols = max(1, (ti->con_cols + 1) / (max_length + 1));
+        unsigned int col_width = ti->con_cols / cols;
+        unsigned int rows = cnum / cols + ((cnum % cols) != 0);
+        unsigned int row, col;
+        for (row = 0; row < rows; row++) {
+                bool wlc = false;
+                for (col = 0; col < cols; col++) {
+                        size_t compl_idx = col * rows + row;
+                        if (compl_idx >= cnum)
+                                break;
+                        if (col)
+                                printf(" ");
+                        printf("%s", compl[compl_idx]);
+                        size_t compl_len = str_length(compl[compl_idx]);
+                        if (col == cols -1) {
+                                wlc = (compl_len == max_length);
+                        }
+                        else {
+                                for (i = compl_len; i < col_width; i++) {
+                                        printf(" ");
+                                }
+                        }
+                }
+                if (!wlc) printf("\n");
+        }
+}
 static void tinput_text_complete(tinput_t *ti)
+{
 …
                         tinput_jump_after(ti);
+                        for (i = 0; i < cnum; i++)
+                                printf("%s\n", compl[i]);
+                        tinput_show_completions(ti, compl, cnum);
                         tinput_display(ti);
+                }

Note: See TracChangeset for help on using the changeset viewer.

Download in other formats: