java emoje表情转标签存储及转换

EmojParseUtil
import lombok.extern.slf4j.Slf4j;
import org.apache.commons.lang3.StringUtils;

import java.io.UnsupportedEncodingException;
import java.net.URLDecoder;
import java.net.URLEncoder;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * @author chenyk
 * @description
 * @date 2023/1/10 11:52
 */
@Slf4j
public class EmojParseUtil {

    private EmojParseUtil(){

    }

    public static String emojiConvert(String str) {
        if (StringUtils.isBlank(str)){
            return "";
        }
        String patternString = "([\\x{10000}-\\x{10ffff}\ud800-\udfff])";

        Pattern pattern = Pattern.compile(patternString);
        Matcher matcher = pattern.matcher(str);
        StringBuffer sb = new StringBuffer();
        while(matcher.find()) {
            try {
                matcher.appendReplacement(
                        sb,
                        "[["
                                + URLEncoder.encode(matcher.group(1),
                                "UTF-8") + "]]");
            } catch(UnsupportedEncodingException e) {
                log.error("@ 转换emj表情为数据库字符,转换失败",e);
            }
        }
        matcher.appendTail(sb);
        log.info("@ 转换emj表情为数据库字符 【{}】 to 【{}】 , len:{}",str,sb.toString(),sb.length());
        return sb.toString();
    }

    /**
     * @Description 还原utf8数据库中保存的含转换后emoji表情的字符串
     * @param str
     * 转换后的字符串
     * @return 转换前的字符串
     * @throws UnsupportedEncodingException
     * exception
     */
    public static String emojiRecovery(String str) {
        if (StringUtils.isBlank(str)){
            return "";
        }
        String patternString = "\\[\\[(.*?)\\]\\]";

        Pattern pattern = Pattern.compile(patternString);
        Matcher matcher = pattern.matcher(str);

        StringBuffer sb = new StringBuffer();
        while(matcher.find()) {
            try {
                matcher.appendReplacement(sb,
                        URLDecoder.decode(matcher.group(1), "UTF-8"));
            } catch(UnsupportedEncodingException e) {
               log.error("@ 转换emj表情 数据库字符转表情失败",e);
            }
        }
        matcher.appendTail(sb);
        log.info("@ 转换 数据库字符转emj表情 【{}】 to 【{}】 , len:{}",str,sb.toString(),sb.length());
        return sb.toString();
    }
}

  

 
 
posted @ 2023-11-28 17:52  叶落の无痕  阅读(121)  评论(0)    收藏  举报