搜狗的测试题，关于解码与编码

题外话：很久没更新了，前一阵子同时扛着两个项目，实在无暇他顾。如果结束了一个，又要开始找工作了。一直想着对自己做的项目总结一下，还是等这段时间过去吧。

今天投了搜狗校招，邮件通知我去做测试。旁边的MM打开测试网页发现提示说恭喜她已经通过测试了，而我打开了俨然一个题目放在那里，说30分钟做完。

题目给出了一个编码的函数，要求给出解码部分的代码，然后执行程序，将运行结果提交。代码如下

#include  <stdio.h> 
#include  <stdlib.h> 
#include  "stdint.h" 
#include  <assert.h> 
#include  <string.h> 


int  encode(const  void*  raw_in,  void*  raw_out,  uint32_t  password,  size_t  len) 
{ 
  const  uint8_t*  in  =  (const  uint8_t*)raw_in; 
  uint8_t*  out  =  (uint8_t*)raw_out; 

  uint32_t  seed  =  password  ^  0x48879c19u; 
  for  (size_t  i  =  0  ;  i  <  len;  ++i)  { 
    uint8_t  a  =  (  in[i]  ^  seed  )  >>  4; 
    uint8_t  b  =  (  (  ((uint32_t)in[i])  <<  11  )  ^  seed  )  >>  (11-4); 
    a  &=  15; 
    b  &=  240; 
    a  =  15  &  (  a  ^  (b  <<  3)); 
    out[i]  =  a  |  b; 
    seed  =  ((seed  ^  in[i])  *  144123481  +  in[i]); 
  }
  return 0;
} 


int  decode(const  void*  raw_in,  void*  raw_out,  uint32_t  password,  size_t  len) 
{ 
  const  uint8_t*  in  =  (const  uint8_t*)raw_in; 
  uint8_t*  out  =  (uint8_t*)raw_out; 

  uint32_t  seed  =  password  ^  0x48879c19u; 
  for  (size_t  i  =  0  ;  i  <  len;  ++i)  { 
    //  请?在?此?处?补?全?代?码?
  } 
  return 0;
} 
int  main() 
{ 
  const  uint8_t  buf1[]  =  {0xc7,  0x23,  0xed,  0x9b,  0x26,  0x0b,  0x51,  0xe4,  0x79,  0x5d,  0x57,  0x0d,  0xbb,  0xca,  0x5d,  0x28,  0xa4,  0xf9,  0x60,  0xcc,  0x65,  0x35,  0x82,  0xa9,  0x2e,  0xe6,  0x03,  0x7c,  0x7d,  0x49,  0x1f,  0x58,  0x0e,  0xbe,  0xd5,  0x49,  0x68,  0x44,  }; 
  uint8_t  buf2[100]  =  {}; 
  const  uint32_t  password  =  0xf765d3bau; 
  const  size_t  len  =  sizeof(buf1); 
  decode(buf1,  buf2,  password,  len); 
  printf("%s\n",  buf2); 
}

我刚看到这段代码时头晕眼花，不喜欢这样的代码风格。硬着头皮读了一下编码的函数，在纸上仔细推理一番，原来是将in[i]与seed做个异或操作，之后a为in[i]的高4位，b为in[i]的低4位，然后交换a和b的位置。

a = 15 & ( a ^ (b << 3)); 这句可以完全不必理会，要得到原有的字节，只需将a和b先还原到异或前的位置（可以将这一系列理解为操作倒置），然后与seed异或，原理是x^y^y=x。这样我们又得到了原有的那些位，再通过移位就可以得到解码后的答案：

int  decode(const  void*  raw_in,  void*  raw_out,  uint32_t  password,  size_t  len) 
{ 
  const  uint8_t*  in  =  (const  uint8_t*)raw_in; 
  uint8_t*  out  =  (uint8_t*)raw_out; 

  uint32_t  seed  =  password  ^  0x48879c19u; 
  for  (size_t  i  =  0  ;  i  <  len;  ++i)  { 
    //  请?在?此?处?补?全?代?码?
    uint8_t a = (in[i] << 4) ^ seed;
    uint8_t b = (((uint32_t)in[i]) << 7 ^ seed) >> 11;
    a &= 240;
    b &= 15;
    out[i] = a | b;
    seed  =  ((seed  ^  out[i])  *  144123481  +  out[i]); 
  } 
  return 0;
}

这是我第二次做测试的题目，前一次的测试我一直没有通过，那题与这题的差别只是a为前5位，b为后3位，seed的计算有些不同。可结果就是不对，我正对结果表示匪夷所思之际，弹框说我已经到时间了。于是重新登录，进行第二次测试。这次我继续用原有的decode代码，将数值按照这一版的encode替换掉，居然就通过了。再撤销代码回到第一次测试那题，检查了几番，结果依然不对。晚上再翻出代码来一看，原来第二次能通过纯属巧合，因为a和b各取了四位。

我错误的原因是，将a与b还原时，应该将a的后三位置0，将b的前5位置0，我却错误地继续使用之前的数值，导致a 的前3位置0，b的后5位置0了。看来是自己检查的还不够仔细。

这里还遇到一个情况就是VS的库中没有stdint.h，于是我只能去网上找了一个，贴在下面：

// ISO C9x  compliant stdint.h for Microsoft Visual Studio
// Based on ISO/IEC 9899:TC2 Committee draft (May 6, 2005) WG14/N1124 
// 
//  Copyright (c) 2006-2008 Alexander Chemeris
// 
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
// 
//   1. Redistributions of source code must retain the above copyright notice,
//      this list of conditions and the following disclaimer.
// 
//   2. Redistributions in binary form must reproduce the above copyright
//      notice, this list of conditions and the following disclaimer in the
//      documentation and/or other materials provided with the distribution.
// 
//   3. The name of the author may be used to endorse or promote products
//      derived from this software without specific prior written permission.
// 
// THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
// EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
// OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, 
// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
// OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
// ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
// 
///////////////////////////////////////////////////////////////////////////////

#ifndef _MSC_VER // [
#error "Use this header only with Microsoft Visual C++ compilers!"
#endif // _MSC_VER ]

#ifndef _MSC_STDINT_H_ // [
#define _MSC_STDINT_H_

#if _MSC_VER > 1000
#pragma once
#endif

#include <limits.h>

// For Visual Studio 6 in C++ mode and for many Visual Studio versions when
// compiling for ARM we should wrap <wchar.h> include with 'extern "C++" {}'
// or compiler give many errors like this:
//   error C2733: second C linkage of overloaded function 'wmemchr' not allowed
#ifdef __cplusplus
extern "C" {
#endif
#  include <wchar.h>
#ifdef __cplusplus
}
#endif

// Define _W64 macros to mark types changing their size, like intptr_t.
#ifndef _W64
#  if !defined(__midl) && (defined(_X86_) || defined(_M_IX86)) && _MSC_VER >= 1300
#     define _W64 __w64
#  else
#     define _W64
#  endif
#endif


// 7.18.1 Integer types

// 7.18.1.1 Exact-width integer types

// Visual Studio 6 and Embedded Visual C++ 4 doesn't
// realize that, e.g. char has the same size as __int8
// so we give up on __intX for them.
#if (_MSC_VER < 1300)
typedef signed char       int8_t;
typedef signed short      int16_t;
typedef signed int        int32_t;
typedef unsigned char     uint8_t;
typedef unsigned short    uint16_t;
typedef unsigned int      uint32_t;
#else
typedef signed __int8     int8_t;
typedef signed __int16    int16_t;
typedef signed __int32    int32_t;
typedef unsigned __int8   uint8_t;
typedef unsigned __int16  uint16_t;
typedef unsigned __int32  uint32_t;
#endif
typedef signed __int64       int64_t;
typedef unsigned __int64     uint64_t;


// 7.18.1.2 Minimum-width integer types
typedef int8_t    int_least8_t;
typedef int16_t   int_least16_t;
typedef int32_t   int_least32_t;
typedef int64_t   int_least64_t;
typedef uint8_t   uint_least8_t;
typedef uint16_t  uint_least16_t;
typedef uint32_t  uint_least32_t;
typedef uint64_t  uint_least64_t;

// 7.18.1.3 Fastest minimum-width integer types
typedef int8_t    int_fast8_t;
typedef int16_t   int_fast16_t;
typedef int32_t   int_fast32_t;
typedef int64_t   int_fast64_t;
typedef uint8_t   uint_fast8_t;
typedef uint16_t  uint_fast16_t;
typedef uint32_t  uint_fast32_t;
typedef uint64_t  uint_fast64_t;

// 7.18.1.4 Integer types capable of holding object pointers
#ifdef _WIN64 // [
typedef signed __int64    intptr_t;
typedef unsigned __int64  uintptr_t;
#else // _WIN64 ][
typedef _W64 signed int   intptr_t;
typedef _W64 unsigned int uintptr_t;
#endif // _WIN64 ]

// 7.18.1.5 Greatest-width integer types
typedef int64_t   intmax_t;
typedef uint64_t  uintmax_t;


// 7.18.2 Limits of specified-width integer types

#if !defined(__cplusplus) || defined(__STDC_LIMIT_MACROS) // [   See footnote 220 at page 257 and footnote 221 at page 259

// 7.18.2.1 Limits of exact-width integer types
#define INT8_MIN     ((int8_t)_I8_MIN)
#define INT8_MAX     _I8_MAX
#define INT16_MIN    ((int16_t)_I16_MIN)
#define INT16_MAX    _I16_MAX
#define INT32_MIN    ((int32_t)_I32_MIN)
#define INT32_MAX    _I32_MAX
#define INT64_MIN    ((int64_t)_I64_MIN)
#define INT64_MAX    _I64_MAX
#define UINT8_MAX    _UI8_MAX
#define UINT16_MAX   _UI16_MAX
#define UINT32_MAX   _UI32_MAX
#define UINT64_MAX   _UI64_MAX

// 7.18.2.2 Limits of minimum-width integer types
#define INT_LEAST8_MIN    INT8_MIN
#define INT_LEAST8_MAX    INT8_MAX
#define INT_LEAST16_MIN   INT16_MIN
#define INT_LEAST16_MAX   INT16_MAX
#define INT_LEAST32_MIN   INT32_MIN
#define INT_LEAST32_MAX   INT32_MAX
#define INT_LEAST64_MIN   INT64_MIN
#define INT_LEAST64_MAX   INT64_MAX
#define UINT_LEAST8_MAX   UINT8_MAX
#define UINT_LEAST16_MAX  UINT16_MAX
#define UINT_LEAST32_MAX  UINT32_MAX
#define UINT_LEAST64_MAX  UINT64_MAX

// 7.18.2.3 Limits of fastest minimum-width integer types
#define INT_FAST8_MIN    INT8_MIN
#define INT_FAST8_MAX    INT8_MAX
#define INT_FAST16_MIN   INT16_MIN
#define INT_FAST16_MAX   INT16_MAX
#define INT_FAST32_MIN   INT32_MIN
#define INT_FAST32_MAX   INT32_MAX
#define INT_FAST64_MIN   INT64_MIN
#define INT_FAST64_MAX   INT64_MAX
#define UINT_FAST8_MAX   UINT8_MAX
#define UINT_FAST16_MAX  UINT16_MAX
#define UINT_FAST32_MAX  UINT32_MAX
#define UINT_FAST64_MAX  UINT64_MAX

// 7.18.2.4 Limits of integer types capable of holding object pointers
#ifdef _WIN64 // [
#  define INTPTR_MIN   INT64_MIN
#  define INTPTR_MAX   INT64_MAX
#  define UINTPTR_MAX  UINT64_MAX
#else // _WIN64 ][
#  define INTPTR_MIN   INT32_MIN
#  define INTPTR_MAX   INT32_MAX
#  define UINTPTR_MAX  UINT32_MAX
#endif // _WIN64 ]

// 7.18.2.5 Limits of greatest-width integer types
#define INTMAX_MIN   INT64_MIN
#define INTMAX_MAX   INT64_MAX
#define UINTMAX_MAX  UINT64_MAX

// 7.18.3 Limits of other integer types

#ifdef _WIN64 // [
#  define PTRDIFF_MIN  _I64_MIN
#  define PTRDIFF_MAX  _I64_MAX
#else  // _WIN64 ][
#  define PTRDIFF_MIN  _I32_MIN
#  define PTRDIFF_MAX  _I32_MAX
#endif  // _WIN64 ]

#define SIG_ATOMIC_MIN  INT_MIN
#define SIG_ATOMIC_MAX  INT_MAX

#ifndef SIZE_MAX // [
#  ifdef _WIN64 // [
#     define SIZE_MAX  _UI64_MAX
#  else // _WIN64 ][
#     define SIZE_MAX  _UI32_MAX
#  endif // _WIN64 ]
#endif // SIZE_MAX ]

// WCHAR_MIN and WCHAR_MAX are also defined in <wchar.h>
#ifndef WCHAR_MIN // [
#  define WCHAR_MIN  0
#endif  // WCHAR_MIN ]
#ifndef WCHAR_MAX // [
#  define WCHAR_MAX  _UI16_MAX
#endif  // WCHAR_MAX ]

#define WINT_MIN  0
#define WINT_MAX  _UI16_MAX

#endif // __STDC_LIMIT_MACROS ]


// 7.18.4 Limits of other integer types

#if !defined(__cplusplus) || defined(__STDC_CONSTANT_MACROS) // [   See footnote 224 at page 260

// 7.18.4.1 Macros for minimum-width integer constants

#define INT8_C(val)  val##i8
#define INT16_C(val) val##i16
#define INT32_C(val) val##i32
#define INT64_C(val) val##i64

#define UINT8_C(val)  val##ui8
#define UINT16_C(val) val##ui16
#define UINT32_C(val) val##ui32
#define UINT64_C(val) val##ui64

// 7.18.4.2 Macros for greatest-width integer constants
#define INTMAX_C   INT64_C
#define UINTMAX_C  UINT64_C

#endif // __STDC_CONSTANT_MACROS ]


#endif // _MSC_STDINT_H_ ]

posted @ 2011-09-15 20:02 筱夏阅读(1874) 评论(4) 编辑收藏举报

亚特兰蒂斯の夏

搜狗的测试题，关于解码与编码

公告