成人免费xxxxx在线视频软件_久久精品久久久_亚洲国产精品久久久_天天色天天色_亚洲人成一区_欧美一级欧美三级在线观看

PHP 源碼探秘 - 為什么 trim 會導致亂碼

新聞 后端
本文通過對 PHP 源碼的探秘,揭示了 trim 會導致亂碼的原因。

[[206885]]

運行以下代碼:

// rtrim() compares single bytes, not whole characters: every trailing byte of
// $tag that also occurs among the bytes of the mask "、" is removed, even when
// that byte belongs to a different multi-byte character.
$tag = '互聯(lián)網(wǎng)產(chǎn)品、';
$text = rtrim($tag, "、");
print_r($text);

運行,我們可能以為會得到的結果是 互聯網產品 ,實際結果是 互聯網產� 。為什么會這樣呢?

原理

trim 函數文檔

string trim ( string $str [, string $character_mask = " \t\n\r\0\x0B" ] )

該函數不是多字節函數,也就是說,漢字這樣的多字節字符,會拿其頭或尾的單字節來和后面的 $character_mask 對應的 char 數組進行匹配,如果在后面的數組中,則刪掉,繼續匹配。比如:

// 'b' and 'c' occur in the mask "abc" and are stripped; 'd' does not, so trimming stops there.
echo ltrim("bcdf","abc"); // df

如下面的 demo 中的函數 string_print_char 所示:

、 由 0xe3 0x80 0x81 三字節組成,

品 由 0xe5 0x93 0x81 三字節組成。

所以在執行 rtrim 的時候,通過字節比對,除了去掉「、」的三個字節之外,還會將「品」末尾同樣存在于 mask 中的 0x81 去掉,只剩下不完整的 0xe5 0x93,導致了最後出現了亂碼。

源碼精簡版演示

查看 PHP7 的源碼,然后提煉出下面的小 demo,方便大家一起學習,其實 PHP 源碼的學習并不難,每天進步一點點。

//
//  main.c
//  trim
//
//  Created by 周夢康 on 2017/10/18.
//  Copyright © 2017年 周夢康. All rights reserved.
//

#include <stdio.h>
#include <stdlib.h>
#include <string.h>

void string_print_char(char *str);
void php_charmask(unsigned char *input, size_t len, char *mask);
char *ltrim(char *str,char *character_mask);
char *rtrim(char *str,char *character_mask);


/*
 * Demo driver: shows byte-wise trimming on an ASCII string, dumps the UTF-8
 * bytes of two characters that share the trailing byte 0x81, and then shows
 * rtrim cutting into a multi-byte character.
 *
 * ltrim/rtrim return heap buffers, so each result is released after printing.
 */
int main(int argc, char const *argv[])
{
    char *left_trimmed;
    char *right_trimmed;

    (void)argc;
    (void)argv;

    left_trimmed = ltrim("bcdf","abc");
    if (left_trimmed != NULL) {
        printf("%s\n", left_trimmed);
        free(left_trimmed);
    }

    string_print_char("品"); // e5    93    81
    string_print_char("、"); // e3    80    81

    /* The mask bytes are e3 80 81, so the final 0x81 of the preceding character is stripped too. */
    right_trimmed = rtrim("互聯(lián)網(wǎng)產(chǎn)品、","、");
    if (right_trimmed != NULL) {
        printf("%s\n", right_trimmed);
        free(right_trimmed);
    }

    return 0;
}

/*
 * Return a newly allocated copy of `str` with every leading byte that occurs
 * in `character_mask` removed.
 *
 * Matching is done one byte at a time, so a multi-byte character is not
 * treated as a unit.
 *
 * str            - NUL-terminated input; not modified.
 * character_mask - NUL-terminated set of bytes to strip.
 *
 * Returns a NUL-terminated heap string that the caller must free(), or NULL
 * if the allocation fails.
 */
char *ltrim(char *str,char *character_mask)
{
    char mask[256];
    char *res;
    size_t len = strlen(str);
    size_t skip = 0;

    php_charmask((unsigned char*)character_mask, strlen(character_mask), mask);

    /* Count leading bytes whose value is flagged in the lookup table. */
    while (skip < len && mask[(unsigned char)str[skip]]) {
        skip++;
    }
    len -= skip;

    res = malloc(len + 1);
    if (res == NULL) {
        return NULL;
    }

    memcpy(res, str + skip, len);
    res[len] = '\0'; /* memcpy copies only the payload; terminate explicitly */

    return res;
}

/*
 * Return a newly allocated copy of `str` with every trailing byte that occurs
 * in `character_mask` removed.
 *
 * Matching is done one byte at a time, so the tail of a multi-byte character
 * can be removed on its own when its last byte equals a byte of the mask.
 *
 * str            - NUL-terminated input; not modified.
 * character_mask - NUL-terminated set of bytes to strip.
 *
 * Returns a NUL-terminated heap string that the caller must free(), or NULL
 * if the allocation fails.
 */
char *rtrim(char *str,char *character_mask)
{
    char mask[256];
    char *res;
    size_t len = strlen(str);

    php_charmask((unsigned char*)character_mask, strlen(character_mask), mask);

    /* Shrink the length while the last remaining byte is flagged in the table. */
    while (len > 0 && mask[(unsigned char)str[len - 1]]) {
        len--;
    }

    res = malloc(len + 1);
    if (res == NULL) {
        return NULL;
    }

    memcpy(res, str, len);
    res[len] = '\0'; /* memcpy copies only the payload; terminate explicitly */

    return res;
}

/*
 * Print every byte of the NUL-terminated string `str` as two hex digits
 * followed by a tab, then end the line.
 */
void string_print_char(char *str)
{
    size_t len = strlen(str);
    size_t i;

    /* size_t index: matches strlen's type and avoids a signed/unsigned comparison. */
    for (i = 0; i < len; i++) {
        printf("%02hhx\t", (unsigned char)str[i]);
    }

    printf("\n");
}

/*
 * Build a byte lookup table: clear all 256 entries of `mask`, then set
 * mask[b] to 1 for each of the first `len` bytes b of `input`.
 */
void php_charmask(unsigned char *input, size_t len, char *mask)
{
    size_t pos;

    memset(mask, 0, 256);

    for (pos = 0; pos < len; pos++) {
        mask[input[pos]] = 1;
    }
}

PHP7 相關源碼

/* trim(): forwards to php_do_trim with mode 3, i.e. both mode bits set, so
 * bytes are stripped from the start (bit 1) and the end (bit 2). */
PHP_FUNCTION(trim)
{
    php_do_trim(INTERNAL_FUNCTION_PARAM_PASSTHRU, 3);
}
/* rtrim(): forwards to php_do_trim with mode 2, so only the end of the
 * string is stripped. */
PHP_FUNCTION(rtrim)
{
    php_do_trim(INTERNAL_FUNCTION_PARAM_PASSTHRU, 2);
}
/* ltrim(): forwards to php_do_trim with mode 1, so only the start of the
 * string is stripped. */
PHP_FUNCTION(ltrim)
{
    php_do_trim(INTERNAL_FUNCTION_PARAM_PASSTHRU, 1);
}
/*
 * Shared implementation behind trim(), rtrim() and ltrim().
 *
 * Reads the string to trim and an optional string of bytes to strip, then
 * stores the result of php_trim() in return_value. When the optional argument
 * is absent, php_trim() receives a NULL mask with length 0.
 *
 * mode - passed through to php_trim() unchanged.
 */
static void php_do_trim(INTERNAL_FUNCTION_PARAMETERS, int mode)
{
    zend_string *str;
    zend_string *what = NULL;
    char *strip_bytes = NULL;
    size_t strip_len = 0;

    ZEND_PARSE_PARAMETERS_START(1, 2)
        Z_PARAM_STR(str)
        Z_PARAM_OPTIONAL
        Z_PARAM_STR(what)
    ZEND_PARSE_PARAMETERS_END();

    /* Only unpack the mask when the caller actually supplied one. */
    if (what) {
        strip_bytes = ZSTR_VAL(what);
        strip_len = ZSTR_LEN(what);
    }

    ZVAL_STR(return_value, php_trim(str, strip_bytes, strip_len, mode));
}
/*
 * Trim bytes from the start and/or the end of `str` and return the result.
 *
 * str      - the string to trim; its bytes and length are read with
 *            ZSTR_VAL / ZSTR_LEN.
 * what     - the bytes to strip, or NULL to strip the built-in set
 *            ' ', '\n', '\r', '\t', '\v', '\0'.
 * what_len - number of bytes in `what`.
 * mode     - bit flags: (mode & 1) trims the start, (mode & 2) trims the end.
 *
 * Every comparison is made on a single byte (c[i]), never on a whole
 * multi-byte character, so a byte that a multi-byte character shares with
 * `what` is stripped on its own.
 *
 * Returns zend_string_copy(str) when no byte was removed, otherwise
 * zend_string_init(c, len, 0) over the remaining bytes.
 */
PHPAPI zend_string *php_trim(zend_string *str, char *what, size_t what_len, int mode)
{
    const char *c = ZSTR_VAL(str);
    size_t len = ZSTR_LEN(str);
    register size_t i;
    size_t trimmed = 0;
    char mask[256];

    if (what) {
        if (what_len == 1) {
            /* Single-byte mask: compare against that byte directly, no lookup table. */
            char p = *what;
            if (mode & 1) {
                /* Count leading bytes equal to p, then advance past them. */
                for (i = 0; i < len; i++) {
                    if (c[i] == p) {
                        trimmed++;
                    } else {
                        break;
                    }
                }
                len -= trimmed;
                c += trimmed;
            }
            if (mode & 2) {
                if (len > 0) {
                    /* i is unsigned, so the loop tests `i-- != 0` after the body
                       instead of checking `i >= 0`. */
                    i = len - 1;
                    do {
                        if (c[i] == p) {
                            len--;
                        } else {
                            break;
                        }
                    } while (i-- != 0);
                }
            }
        } else {
            /* Build a 256-entry table indexed by byte value; the return value
               of php_charmask is not checked here. */
            php_charmask((unsigned char*)what, what_len, mask);

            if (mode & 1) {
                /* Count leading bytes flagged in the table, then advance past them. */
                for (i = 0; i < len; i++) {
                    if (mask[(unsigned char)c[i]]) {
                        trimmed++;
                    } else {
                        break;
                    }
                }
                len -= trimmed;
                c += trimmed;
            }
            if (mode & 2) {
                if (len > 0) {
                    /* Walk backwards from the last byte while it is flagged in the table. */
                    i = len - 1;
                    do {
                        if (mask[(unsigned char)c[i]]) {
                            len--;
                        } else {
                            break;
                        }
                    } while (i-- != 0);
                }
            }
        }
    } else {
        /* No mask supplied: strip the built-in set of bytes. */
        if (mode & 1) {
            for (i = 0; i < len; i++) {
                /* The `<= ' '` test rejects most bytes before the individual comparisons. */
                if ((unsigned char)c[i] <= ' ' &&
                    (c[i] == ' ' || c[i] == '\n' || c[i] == '\r' || c[i] == '\t' || c[i] == '\v' || c[i] == '\0')) {
                    trimmed++;
                } else {
                    break;
                }
            }
            len -= trimmed;
            c += trimmed;
        }
        if (mode & 2) {
            if (len > 0) {
                i = len - 1;
                do {
                    if ((unsigned char)c[i] <= ' ' &&
                        (c[i] == ' ' || c[i] == '\n' || c[i] == '\r' || c[i] == '\t' || c[i] == '\v' || c[i] == '\0')) {
                        len--;
                    } else {
                        break;
                    }
                } while (i-- != 0);
            }
        }
    }

    /* Unchanged length means nothing was trimmed from either end. */
    if (ZSTR_LEN(str) == len) {
        return zend_string_copy(str);
    } else {
        return zend_string_init(c, len, 0);
    }
}
/* {{{ php_charmask
 * Fills a 256-byte bytemask with input. You can specify a range like 'a..z',
 * it needs to be incrementing.
 *
 * input - the bytes describing the mask; read one byte at a time.
 * len   - number of bytes in input.
 * mask  - output table of 256 entries; cleared first, then mask[b] is set to 1
 *         for every byte b that is listed or covered by a range.
 *
 * Returns: FAILURE/SUCCESS whether the input was correct (i.e. no range errors)
 */
static inline int php_charmask(unsigned char *input, size_t len, char *mask)
{
    unsigned char *end;
    unsigned char c;
    int result = SUCCESS;

    memset(mask, 0, 256);
    for (end = input+len; input < end; input++) {
        c=*input;
        /* Range "c..X": input[3] is still inside the buffer, the next two bytes
           are dots and the upper bound is not below c. */
        if ((input+3 < end) && input[1] == '.' && input[2] == '.'
                && input[3] >= c) {
            /* Flag every byte value from c through input[3] inclusive. */
            memset(mask+c, 1, input[3] - c + 1);
            /* Together with the loop's input++ this steps past all four bytes. */
            input+=3;
        } else if ((input+1 < end) && input[0] == '.' && input[1] == '.') {
            /* Error, try to be as helpful as possible:
               (a range ending/starting with '.' won't be captured here) */
            /* end-len is the original start of the input buffer. */
            if (end-len >= input) { /* there was no 'left' char */
                php_error_docref(NULL, E_WARNING, "Invalid '..'-range, no character to the left of '..'");
                result = FAILURE;
                continue;
            }
            if (input+2 >= end) { /* there is no 'right' char */
                php_error_docref(NULL, E_WARNING, "Invalid '..'-range, no character to the right of '..'");
                result = FAILURE;
                continue;
            }
            if (input[-1] > input[2]) { /* wrong order */
                php_error_docref(NULL, E_WARNING, "Invalid '..'-range, '..'-range needs to be incrementing");
                result = FAILURE;
                continue;
            }
            /* FIXME: better error (a..b..c is the only left possibility?) */
            php_error_docref(NULL, E_WARNING, "Invalid '..'-range");
            result = FAILURE;
            continue;
        } else {
            /* Plain byte: flag it directly. */
            mask[c]=1;
        }
    }
    return result;
}
/* }}} */
責任編輯:張燕妮 來源:周夢康的博客
相關(guān)推薦

2020-10-15 09:35:27

亂碼UTF-8GBK

2024-07-18 20:18:51

2017-01-05 18:43:58

閏秒Linux服務(wù)器

2024-05-27 08:04:41

2024-05-27 08:01:15

2009-07-20 10:34:44

2021-08-10 09:58:59

ThreadLocal內(nèi)存泄漏

2021-01-25 07:14:53

Cloud DevOps云計(jì)算

2022-04-13 20:53:15

Spring事務(wù)管理

2023-03-22 09:10:18

IT文檔語(yǔ)言

2014-03-05 14:58:00

蘋果CarPlayiOS

2015-12-07 10:49:43

卸載App用戶體驗(yàn)

2022-05-11 08:22:54

IO負(fù)載NFSOS

2012-03-26 10:26:43

openstackeucalyptus

2012-05-02 10:08:51

桌面Linux微軟

2012-08-17 10:01:07

云計(jì)算

2021-07-09 09:24:06

NanoID UUID軟件開(kāi)發(fā)

2020-03-30 15:05:46

Kafka消息數(shù)據(jù)

2020-07-23 08:21:25

PHP開(kāi)發(fā)人員MVC

2020-06-10 14:10:53

服務(wù)開(kāi)發(fā) 架構(gòu)
點(diǎn)贊
收藏

51CTO技術(shù)棧公眾號(hào)

主站蜘蛛池模板: 成人在线视频免费播放 | 国产在线观看网站 | 91麻豆精品一区二区三区 | 欧美日韩成人一区二区 | 99免费视频 | 国产电影精品久久 | 成人av网站在线观看 | 亚洲国产成人久久久 | 情侣av| 97视频精品 | 成人不卡 | 日本特黄特色aaa大片免费 | 国产小视频自拍 | 成人在线电影在线观看 | 国产视频久久 | 成年人在线观看 | 中文字幕一区在线观看视频 | 日韩一区二区在线视频 | 国产精品美女久久久 | 九九热在线视频观看这里只有精品 | 日本一区二区在线视频 | 亚洲欧美一区二区三区在线 | 亚洲欧洲成人av每日更新 | 精品久久久一区 | 国产成人一区二 | 欧美日韩三级 | 波多野结衣一区二区三区 | 天天视频一区二区三区 | 亚洲国产精品久久 | 日韩在线播放网址 | 亚洲一区久久久 | 午夜免费在线观看 | 免费中文字幕日韩欧美 | 都市激情亚洲 | 亚洲精品一二区 | 日韩久久久一区二区 | 欧美亚洲国产日韩 | 欧美爱爱视频网站 | 欧美日韩毛片 | 99爱视频 | 亚洲欧美成人影院 |