Account for underscores when tokenizing mentions for autocompletion (#888)

* Account for underscores when tokenizing mentions for autocompletion. Fixes #743
* Migrate MentionTokenizer to Kotlin
* Add tests for mention tokenizer
2018-10-19 17:44:46 +02:00 · 2018-10-19 17:44:46 +02:00 · af298e5281
commit af298e5281
parent 952d2a6512
3 changed files with 133 additions and 67 deletions
--- a/app/src/main/java/com/keylesspalace/tusky/util/MentionTokenizer.java
+++ b/app/src/main/java/com/keylesspalace/tusky/util/MentionTokenizer.java
@ -1,67 +0,0 @@
 /* Copyright 2017 Andrew Dawson
 *
 * This file is a part of Tusky.
 *
 * This program is free software; you can redistribute it and/or modify it under the terms of the
 * GNU General Public License as published by the Free Software Foundation; either version 3 of the
 * License, or (at your option) any later version.
 *
 * Tusky is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even
 * the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
 * Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along with Tusky; if not,
 * see <http://www.gnu.org/licenses>. */
 package com.keylesspalace.tusky.util;
 import android.text.SpannableString;
 import android.text.Spanned;
 import android.text.TextUtils;
 import android.widget.MultiAutoCompleteTextView;
 /**
  * Tokenizer for a {@link MultiAutoCompleteTextView} that treats a run of letters and digits
  * directly preceded by {@code '@'} as a token, and uses a single space as the terminator.
  */
 public class MentionTokenizer implements MultiAutoCompleteTextView.Tokenizer {
    /**
     * Scans backwards from {@code cursor} looking for the {@code '@'} that opens a token.
     *
     * @param text   the text being edited
     * @param cursor the offset to scan backwards from
     * @return the offset just after the {@code '@'} when every character between it and
     *         {@code cursor} is a letter or digit; otherwise {@code cursor} itself
     */
    @Override
    public int findTokenStart(CharSequence text, int cursor) {
        int start = cursor;
        while (start > 0) {
            final char previous = text.charAt(start - 1);
            if (previous == '@') {
                // Found the opening '@'; the token begins right after it.
                return start;
            }
            if (!Character.isLetterOrDigit(previous)) {
                // Hit a character that cannot be part of a token before reaching any '@'.
                return cursor;
            }
            start--;
        }
        // Reached the beginning of the text (or started at/before it) without seeing '@'.
        return cursor;
    }

    /**
     * Scans forwards from {@code cursor} for the first space.
     *
     * @param text   the text being edited
     * @param cursor the offset to scan forwards from
     * @return the offset of the first space at or after {@code cursor}, or the length of
     *         {@code text} when there is none
     */
    @Override
    public int findTokenEnd(CharSequence text, int cursor) {
        final int length = text.length();
        for (int end = cursor; end < length; end++) {
            if (text.charAt(end) == ' ') {
                return end;
            }
        }
        return length;
    }

    /**
     * Returns {@code text} followed by a space, keeping its spans when it is a {@link Spanned}.
     *
     * @param text the token text to terminate
     * @return a {@link SpannableString} for spanned input, otherwise a plain string
     */
    @Override
    public CharSequence terminateToken(CharSequence text) {
        int end = text.length();
        while (end > 0 && text.charAt(end - 1) == ' ') {
            end--;
        }

        // Note: the loop above stops only when the character before `end` is not a space,
        // so this check never succeeds and a space is always appended below.
        if (end > 0 && text.charAt(end - 1) == ' ') {
            return text;
        }

        final String terminated = text + " ";
        if (!(text instanceof Spanned)) {
            return terminated;
        }

        final SpannableString spannable = new SpannableString(terminated);
        TextUtils.copySpansFrom((Spanned) text, 0, text.length(), Object.class, spannable, 0);
        return spannable;
    }
 }
--- a/app/src/main/java/com/keylesspalace/tusky/util/MentionTokenizer.kt
+++ b/app/src/main/java/com/keylesspalace/tusky/util/MentionTokenizer.kt
@ -0,0 +1,72 @@
 /* Copyright 2017 Andrew Dawson
 *
 * This file is a part of Tusky.
 *
 * This program is free software; you can redistribute it and/or modify it under the terms of the
 * GNU General Public License as published by the Free Software Foundation; either version 3 of the
 * License, or (at your option) any later version.
 *
 * Tusky is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even
 * the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
 * Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along with Tusky; if not,
 * see <http://www.gnu.org/licenses>. */
 package com.keylesspalace.tusky.util
 import android.text.SpannableString
 import android.text.Spanned
 import android.text.TextUtils
 import android.widget.MultiAutoCompleteTextView
 /**
  * Tokenizer for a [MultiAutoCompleteTextView] that treats a run of letters, digits and
  * underscores directly preceded by `'@'` as a token, and uses a single space as the terminator.
  */
 class MentionTokenizer : MultiAutoCompleteTextView.Tokenizer {
    /**
     * Scans backwards from [cursor] looking for the `'@'` that opens a token.
     *
     * @param text the text being edited
     * @param cursor the offset to scan backwards from
     * @return the offset just after the `'@'` when every character between it and [cursor] is a
     * letter, digit or underscore; otherwise [cursor] itself (including when [cursor] is zero or
     * negative)
     */
    override fun findTokenStart(text: CharSequence, cursor: Int): Int {
        var i = cursor
        // The `i > 0` guard also covers a zero or negative cursor, which is returned unchanged.
        while (i > 0) {
            val character = text[i - 1]
            if (character == '@') {
                return i
            }
            // See SpanUtils.MENTION_REGEX
            if (!Character.isLetterOrDigit(character) && character != '_') {
                return cursor
            }
            i--
        }
        // Reached the beginning of the text without seeing '@'.
        return cursor
    }

    /**
     * Scans forwards from [cursor] for the first space.
     *
     * @param text the text being edited
     * @param cursor the offset to scan forwards from
     * @return the offset of the first space at or after [cursor], or the length of [text] when
     * there is none
     */
    override fun findTokenEnd(text: CharSequence, cursor: Int): Int {
        val length = text.length
        for (i in cursor until length) {
            if (text[i] == ' ') {
                return i
            }
        }
        return length
    }

    /**
     * Ensures [text] ends with the space terminator.
     *
     * @param text the token text to terminate
     * @return [text] itself when it already ends with a space; otherwise [text] followed by a
     * space, as a [SpannableString] carrying the original spans when [text] is a [Spanned]
     */
    override fun terminateToken(text: CharSequence): CharSequence {
        return when {
            // Already terminated: do not append a second space.
            text.endsWith(' ') -> text
            text is Spanned -> {
                val s = SpannableString(text.toString() + " ")
                TextUtils.copySpansFrom(text, 0, text.length, Object::class.java, s, 0)
                s
            }
            else -> text.toString() + " "
        }
    }
 }
--- a/app/src/test/java/com/keylesspalace/tusky/MentionTokenizerTest.kt
+++ b/app/src/test/java/com/keylesspalace/tusky/MentionTokenizerTest.kt
@ -0,0 +1,61 @@
 /* Copyright 2018 Levi Bard
 *
 * This file is a part of Tusky.
 *
 * This program is free software; you can redistribute it and/or modify it under the terms of the
 * GNU General Public License as published by the Free Software Foundation; either version 3 of the
 * License, or (at your option) any later version.
 *
 * Tusky is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even
 * the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
 * Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along with Tusky; if not,
 * see <http://www.gnu.org/licenses>. */
 package com.keylesspalace.tusky
 import com.keylesspalace.tusky.util.MentionTokenizer
 import org.junit.Assert
 import org.junit.Test
 import org.junit.runner.RunWith
 import org.junit.runners.Parameterized
/**
 * Parameterized checks of [MentionTokenizer.findTokenStart] and [MentionTokenizer.findTokenEnd].
 *
 * Every case places the cursor at the end of [text] and compares the indices reported by the
 * tokenizer with [expectedStartIndex] and [expectedEndIndex].
 */
@RunWith(Parameterized::class)
 class MentionTokenizerTest(
    private val text: CharSequence,
    private val expectedStartIndex: Int,
    private val expectedEndIndex: Int
 ) {
    private val tokenizer = MentionTokenizer()

    @Test
    fun tokenIndices_matchExpectations() {
        val cursor = text.length

        val actualStartIndex = tokenizer.findTokenStart(text, cursor)
        Assert.assertEquals(expectedStartIndex, actualStartIndex)

        val actualEndIndex = tokenizer.findTokenEnd(text, cursor)
        Assert.assertEquals(expectedEndIndex, actualEndIndex)
    }

    companion object {
        /** Rows of (input text, expected token start, expected token end). */
        @Parameterized.Parameters(name = "{0}")
        @JvmStatic
        fun data(): Iterable<Any> = listOf(
            // A single mention at the very start of the text.
            arrayOf("@mention", 1, 8),
            arrayOf("@ment10n", 1, 8),
            arrayOf("@ment10n_", 1, 9),
            arrayOf("@ment10n_n", 1, 10),
            arrayOf("@ment10n_9", 1, 10),
            // A single mention after a leading space.
            arrayOf(" @mention", 2, 9),
            arrayOf(" @ment10n", 2, 9),
            arrayOf(" @ment10n_", 2, 10),
            // A second mention following a completed one.
            arrayOf(" @ment10n_ @", 12, 12),
            arrayOf(" @ment10n_ @ment20n", 12, 19),
            arrayOf(" @ment10n_ @ment20n_", 12, 20),
            arrayOf(" @ment10n_ @ment20n_n", 12, 21),
            arrayOf(" @ment10n_ @ment20n_9", 12, 21),
            // No '@' at all: the start index equals the cursor.
            arrayOf("mention", 7, 7),
            arrayOf("ment10n", 7, 7),
            arrayOf("mentio_", 7, 7)
        )
    }
 }