最初的主要问题
由于您尝试修改字符串文字(函数的参数),您会遇到分段错误。
字符串文字通常在只读内存中,可能不会被合法地修改。尝试这样做会导致未定义的行为。分段错误是一种合法的未定义行为。
如果你写了,你会没事的:
int main(void)
{
char str[] = "My Name is john ";
printf("output is %s", encodeSpace(str));
return 0;
}
甚至(使用 C99 复合文字):
int main(void)
{
printf("output is %s", encodeSpace((char[]){"My Name is john "}));
return 0;
}
算法问题
因为你可以在一个循环中递减tmp
两次,所以你不能保证在它到达orig
指针时识别出来。此代码在以下位置崩溃assert()
:
#include <assert.h>
#include <inttypes.h>
#include <stdio.h>
#include <string.h>
static
char *encodeSpace(char *str)
{
char *orig = str;
printf("-->> str = %p <<%s>>\n", (void *)str, str);
while (*str++)
;
str--;
char *tmp = --str;
while (*tmp-- == ' ')
;
tmp++;
printf("tmp = %p <<%s>>\n", (void *)tmp, tmp);
printf("str = %p <<%s>>\n", (void *)str, str);
while (tmp != orig)
{
while (*tmp != ' ' && tmp != orig)
{
printf("--1: tmp = %p <<%s>>; str = %p <<%s>>\n", (void *)tmp, tmp, (void *)str, str);
*str = *tmp; // segfault at this location..
tmp--;
str--;
printf("--2: tmp = %p <<%s>>; str = %p <<%s>>\n", (void *)tmp, tmp, (void *)str, str);
}
//if (tmp != orig)
//{
*str-- = '0';
*str-- = '2';
*str-- = '%';
tmp--;
//}
printf("--3: tmp = %p <<%s>>; str = %p <<%s>>\n", (void *)tmp, tmp, (void *)str, str);
assert(tmp >= orig);
}
printf("<<-- tmp = <<%s>>\n", tmp);
return tmp;
}
int main(void)
{
printf("output is <<%s>>\n", encodeSpace((char[]){"My name is John "}));
return 0;
}
删除评论,它不再崩溃(第二个减量tmp
是受保护的)。但输出并不是你想要的。
-->> str = 0x7fff54cb44c0 <<My name is John >>
tmp = 0x7fff54cb44ce <<n >>
str = 0x7fff54cb44d7 << >>
--1: tmp = 0x7fff54cb44ce <<n >>; str = 0x7fff54cb44d7 << >>
--2: tmp = 0x7fff54cb44cd <<hn n>>; str = 0x7fff54cb44d6 << n>>
--1: tmp = 0x7fff54cb44cd <<hn n>>; str = 0x7fff54cb44d6 << n>>
--2: tmp = 0x7fff54cb44cc <<ohn hn>>; str = 0x7fff54cb44d5 << hn>>
--1: tmp = 0x7fff54cb44cc <<ohn hn>>; str = 0x7fff54cb44d5 << hn>>
--2: tmp = 0x7fff54cb44cb <<John ohn>>; str = 0x7fff54cb44d4 << ohn>>
--1: tmp = 0x7fff54cb44cb <<John ohn>>; str = 0x7fff54cb44d4 << ohn>>
--2: tmp = 0x7fff54cb44ca << John John>>; str = 0x7fff54cb44d3 << John>>
--3: tmp = 0x7fff54cb44c9 <<s John %20John>>; str = 0x7fff54cb44d0 << %20John>>
--1: tmp = 0x7fff54cb44c9 <<s John %20John>>; str = 0x7fff54cb44d0 << %20John>>
--2: tmp = 0x7fff54cb44c8 <<is John s%20John>>; str = 0x7fff54cb44cf << s%20John>>
--1: tmp = 0x7fff54cb44c8 <<is John s%20John>>; str = 0x7fff54cb44cf << s%20John>>
--2: tmp = 0x7fff54cb44c7 << is Johnis%20John>>; str = 0x7fff54cb44ce <<nis%20John>>
--3: tmp = 0x7fff54cb44c6 <<e is J%20is%20John>>; str = 0x7fff54cb44cb <<J%20is%20John>>
--1: tmp = 0x7fff54cb44c6 <<e is J%20is%20John>>; str = 0x7fff54cb44cb <<J%20is%20John>>
--2: tmp = 0x7fff54cb44c5 <<me is e%20is%20John>>; str = 0x7fff54cb44ca << e%20is%20John>>
--1: tmp = 0x7fff54cb44c5 <<me is e%20is%20John>>; str = 0x7fff54cb44ca << e%20is%20John>>
--2: tmp = 0x7fff54cb44c4 <<ame isme%20is%20John>>; str = 0x7fff54cb44c9 <<sme%20is%20John>>
--1: tmp = 0x7fff54cb44c4 <<ame isme%20is%20John>>; str = 0x7fff54cb44c9 <<sme%20is%20John>>
--2: tmp = 0x7fff54cb44c3 <<name iame%20is%20John>>; str = 0x7fff54cb44c8 <<iame%20is%20John>>
--1: tmp = 0x7fff54cb44c3 <<name iame%20is%20John>>; str = 0x7fff54cb44c8 <<iame%20is%20John>>
--2: tmp = 0x7fff54cb44c2 << name name%20is%20John>>; str = 0x7fff54cb44c7 << name%20is%20John>>
--3: tmp = 0x7fff54cb44c1 <<y na%20name%20is%20John>>; str = 0x7fff54cb44c4 <<a%20name%20is%20John>>
--1: tmp = 0x7fff54cb44c1 <<y na%20name%20is%20John>>; str = 0x7fff54cb44c4 <<a%20name%20is%20John>>
--2: tmp = 0x7fff54cb44c0 <<My ny%20name%20is%20John>>; str = 0x7fff54cb44c3 <<ny%20name%20is%20John>>
--3: tmp = 0x7fff54cb44c0 <<My ny%20name%20is%20John>>; str = 0x7fff54cb44c3 <<ny%20name%20is%20John>>
<<-- tmp = <<My ny%20name%20is%20John>>
output is <<My ny%20name%20is%20John>>
我认为您的算法很复杂,因为您正试图就地进行更改。我不知道如何解决它。传入输入字符串(可以是字符串文字,并且不需要填充空白)和您在调用中指定大小的输出缓冲区会简单得多:
#include <stdio.h>
static int encodeSpace(char const *src, char *buffer, size_t buflen)
{
char *end = buffer + buflen;
char c;
char *dst = buffer;
while ((c = *src++) != '\0' && dst < end)
{
if (c != ' ')
*dst++ = c;
else if (dst < end - 3)
{
*dst++ = '%';
*dst++ = '2';
*dst++ = '0';
}
else
return -1;
}
*dst = '\0';
return 0;
}
int main(void)
{
char buffer[64];
if (encodeSpace("My name is John", buffer, sizeof(buffer)) == 0)
printf("output is <<%s>>\n", buffer);
return 0;
}
输出:
output is <<My%20name%20is%20John>>