0

此代码将空格替换%20为 char 数组应该包含足够的空格以添加%20.

你能帮我理解为什么我会出现段*str = *tmp; // segfault at this location..错误吗?

#include <stdio.h>
#include <string.h>


char* encodeSpace(char* str) {
    char *orig = str;
    while (*str++);

     str--;
     char *tmp = --str;
     while (*tmp-- == ' ');
     tmp++;
     while (tmp != orig) {
        while(*tmp != ' ' && tmp != orig) {

        *str = *tmp; // segfault at this location.. 
         tmp--;
         str--;
        }
        *str-- = '0';
        *str-- = '2';
        *str-- = '%';
        tmp--;
     }
     return tmp;
}

main()
{
   printf("output is %s", encodeSpace("My Name is john         "));
}
4

2 回答 2

3

最初的主要问题

由于您尝试修改字符串文字(函数的参数),您会遇到分段错误。

字符串文字通常在只读内存中,可能不会被合法地修改。尝试这样做会导致未定义的行为。分段错误是一种合法的未定义行为。

如果你写了,你会没事的:

int main(void)
{
    char str[] = "My Name is john         ";
    printf("output is %s", encodeSpace(str));
    return 0;
}

甚至(使用 C99 复合文字):

int main(void)
{
    printf("output is %s", encodeSpace((char[]){"My Name is john         "}));
    return 0;
}

算法问题

因为你可以在一个循环中递减tmp两次,所以你不能保证在它到达orig指针时识别出来。此代码在以下位置崩溃assert()

#include <assert.h>
#include <inttypes.h>
#include <stdio.h>
#include <string.h>

static
char *encodeSpace(char *str)
{
    char *orig = str;
    printf("-->> str = %p <<%s>>\n", (void *)str, str);

    while (*str++)
        ;

    str--;
    char *tmp = --str;
    while (*tmp-- == ' ')
        ;
    tmp++;
    printf("tmp = %p <<%s>>\n", (void *)tmp, tmp);
    printf("str = %p <<%s>>\n", (void *)str, str);
    while (tmp != orig)
    {
        while (*tmp != ' ' && tmp != orig)
        {
            printf("--1: tmp = %p <<%s>>; str = %p <<%s>>\n", (void *)tmp, tmp, (void *)str, str);
            *str = *tmp; // segfault at this location..
            tmp--;
            str--;
            printf("--2: tmp = %p <<%s>>; str = %p <<%s>>\n", (void *)tmp, tmp, (void *)str, str);
        }
        //if (tmp != orig)
        //{
        *str-- = '0';
        *str-- = '2';
        *str-- = '%';
        tmp--;
        //}
        printf("--3: tmp = %p <<%s>>; str = %p <<%s>>\n", (void *)tmp, tmp, (void *)str, str);
        assert(tmp >= orig);
    }
    printf("<<-- tmp = <<%s>>\n", tmp);
    return tmp;
}

int main(void)
{
    printf("output is <<%s>>\n", encodeSpace((char[]){"My name is John         "}));
    return 0;
}

删除评论,它不再崩溃(第二个减量tmp是受保护的)。但输出并不是你想要的。

-->> str = 0x7fff54cb44c0 <<My name is John         >>
tmp = 0x7fff54cb44ce <<n         >>
str = 0x7fff54cb44d7 << >>
--1: tmp = 0x7fff54cb44ce <<n         >>; str = 0x7fff54cb44d7 << >>
--2: tmp = 0x7fff54cb44cd <<hn        n>>; str = 0x7fff54cb44d6 << n>>
--1: tmp = 0x7fff54cb44cd <<hn        n>>; str = 0x7fff54cb44d6 << n>>
--2: tmp = 0x7fff54cb44cc <<ohn       hn>>; str = 0x7fff54cb44d5 << hn>>
--1: tmp = 0x7fff54cb44cc <<ohn       hn>>; str = 0x7fff54cb44d5 << hn>>
--2: tmp = 0x7fff54cb44cb <<John      ohn>>; str = 0x7fff54cb44d4 << ohn>>
--1: tmp = 0x7fff54cb44cb <<John      ohn>>; str = 0x7fff54cb44d4 << ohn>>
--2: tmp = 0x7fff54cb44ca << John     John>>; str = 0x7fff54cb44d3 << John>>
--3: tmp = 0x7fff54cb44c9 <<s John  %20John>>; str = 0x7fff54cb44d0 << %20John>>
--1: tmp = 0x7fff54cb44c9 <<s John  %20John>>; str = 0x7fff54cb44d0 << %20John>>
--2: tmp = 0x7fff54cb44c8 <<is John s%20John>>; str = 0x7fff54cb44cf << s%20John>>
--1: tmp = 0x7fff54cb44c8 <<is John s%20John>>; str = 0x7fff54cb44cf << s%20John>>
--2: tmp = 0x7fff54cb44c7 << is Johnis%20John>>; str = 0x7fff54cb44ce <<nis%20John>>
--3: tmp = 0x7fff54cb44c6 <<e is J%20is%20John>>; str = 0x7fff54cb44cb <<J%20is%20John>>
--1: tmp = 0x7fff54cb44c6 <<e is J%20is%20John>>; str = 0x7fff54cb44cb <<J%20is%20John>>
--2: tmp = 0x7fff54cb44c5 <<me is e%20is%20John>>; str = 0x7fff54cb44ca << e%20is%20John>>
--1: tmp = 0x7fff54cb44c5 <<me is e%20is%20John>>; str = 0x7fff54cb44ca << e%20is%20John>>
--2: tmp = 0x7fff54cb44c4 <<ame isme%20is%20John>>; str = 0x7fff54cb44c9 <<sme%20is%20John>>
--1: tmp = 0x7fff54cb44c4 <<ame isme%20is%20John>>; str = 0x7fff54cb44c9 <<sme%20is%20John>>
--2: tmp = 0x7fff54cb44c3 <<name iame%20is%20John>>; str = 0x7fff54cb44c8 <<iame%20is%20John>>
--1: tmp = 0x7fff54cb44c3 <<name iame%20is%20John>>; str = 0x7fff54cb44c8 <<iame%20is%20John>>
--2: tmp = 0x7fff54cb44c2 << name name%20is%20John>>; str = 0x7fff54cb44c7 << name%20is%20John>>
--3: tmp = 0x7fff54cb44c1 <<y na%20name%20is%20John>>; str = 0x7fff54cb44c4 <<a%20name%20is%20John>>
--1: tmp = 0x7fff54cb44c1 <<y na%20name%20is%20John>>; str = 0x7fff54cb44c4 <<a%20name%20is%20John>>
--2: tmp = 0x7fff54cb44c0 <<My ny%20name%20is%20John>>; str = 0x7fff54cb44c3 <<ny%20name%20is%20John>>
--3: tmp = 0x7fff54cb44c0 <<My ny%20name%20is%20John>>; str = 0x7fff54cb44c3 <<ny%20name%20is%20John>>
<<-- tmp = <<My ny%20name%20is%20John>>
output is <<My ny%20name%20is%20John>>

我认为您的算法很复杂,因为您正试图就地进行更改。我不知道如何解决它。传入输入字符串(可以是字符串文字,并且不需要填充空白)和您在调用中指定大小的输出缓冲区会简单得多:

#include <stdio.h>

static int encodeSpace(char const *src, char *buffer, size_t buflen)
{
    char *end = buffer + buflen;
    char c;
    char *dst = buffer;

    while ((c = *src++) != '\0' && dst < end)
    {
        if (c != ' ')
            *dst++ = c;
        else if (dst < end - 3)
        {
            *dst++ = '%';
            *dst++ = '2';
            *dst++ = '0';
        }
        else
            return -1;
    }
    *dst = '\0';
    return 0;
}

int main(void)
{
    char buffer[64];

    if (encodeSpace("My name is John", buffer, sizeof(buffer)) == 0)
        printf("output is <<%s>>\n", buffer);

    return 0;
}

输出:

output is <<My%20name%20is%20John>>
于 2013-10-19T04:03:16.230 回答
0

@Jonathan Leffler 的解决方案非常完美。

我试图修复原始算法,但看起来很难更改原始字符缓冲区,因为%20需要三个字符位置,如果space字符不够,代码仍然会出错。

如果空间足够,则以下代码效果很好。

#include <stdio.h>
#include <string.h>


char* encodeSpace(char* str) {
    char *orig = str;
    while (*str++);

     str--;
     char *tmp = --str;
     while (*tmp == ' ') tmp--;
     tmp++;
     while (tmp != orig) {
        while(*tmp != ' ') {
         *str = *tmp;
         str--;
         if (tmp == orig)
            break;
         else
           tmp--;
        }
        if (*tmp == ' ') {
          *str-- = '0';
          *str-- = '2';
          *str-- = '%';
          while (*tmp == ' ') tmp--;
        } 
     }
     return ++str;
}

int main()
{

    char str[] = "My Name is john            ";
   printf("output is %s\n", encodeSpace(str));
   return 0;
}
于 2013-10-19T05:57:11.897 回答