BigQuery用户定义函数中的Base64编码

时间:2017-06-29 23:02:27

标签: javascript base64 google-bigquery user-defined-functions

BigQuery 使用 JavaScript 来编写用户定义函数(UDF)。BigQuery 中 BYTES 类型的输入和输出,在 JavaScript 中会映射为 base64 编码的字符串。

BigQuery 没有浏览器的 window 对象,因此缺少 atob 和 btoa。在 BigQuery 的 JS 环境中,是否有一种简单的编码和解码方法,还是必须引入一个库来完成这种映射?

1 个答案:

答案 0 :(得分:3)

您需要包含一个库,不过只要把 JavaScript 文件上传到云存储(Cloud Storage),做起来就很简单,而且同样的方法也适用于您想导入的其他公共库。我在一篇 StackOverflow 帖子中找到了一个实现,并将其内容保存到名为 btoa_atob.js 的文件中:

btoa_atob.js

然后我将文件复制到我的云端存储:

/**
 * Minimal `btoa` / `atob` polyfill for JavaScript environments that have no
 * browser `window` object.
 *
 * Installs two functions on the global object:
 *   - btoa(input): Latin-1 ("binary") string -> base64 string
 *   - atob(input): base64 string -> Latin-1 ("binary") string
 *
 * Written in ES5 syntax on purpose so it loads in older script engines.
 */
(function (root) {
  // The 64 characters of the standard base64 alphabet, indexed by 6-bit value.
  // The padding character is kept separate so the decoder can never mistake
  // it for a data character.
  var ALPHABET = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/';
  var PAD = '=';

  /**
   * Error thrown by `btoa` and `atob` for input they cannot process.
   * @param {string} message - Human-readable description of the failure.
   */
  function InvalidCharacterError(message) {
    this.message = message;
  }
  // Inherit from Error so `instanceof Error` checks succeed.
  InvalidCharacterError.prototype = new Error();
  InvalidCharacterError.prototype.name = 'InvalidCharacterError';

  /**
   * Encodes a binary string as base64.
   *
   * @param {*} input - Value to encode; it is converted with `String(input)`.
   *   Every character must have a code unit in the range 0x00-0xFF.
   * @returns {string} The base64 encoding, padded with "=" to a multiple of 4.
   * @throws {InvalidCharacterError} If any character is above 0xFF.
   */
  root.btoa = function (input) {
    var str = String(input);
    var output = '';

    // Process the input three bytes (24 bits) at a time; each group yields
    // four 6-bit indexes into ALPHABET.
    for (var start = 0; start < str.length; start += 3) {
      var available = Math.min(3, str.length - start);
      var group = 0;

      for (var offset = 0; offset < 3; offset++) {
        // Missing bytes in the final group are treated as zero bits.
        var code = offset < available ? str.charCodeAt(start + offset) : 0;
        if (code > 0xFF) {
          throw new InvalidCharacterError("'btoa' failed: The string to be encoded contains characters outside of the Latin1 range.");
        }
        group = group << 8 | code;
      }

      // A final group of 1 or 2 bytes only fills 2 or 3 output characters;
      // the rest of the quartet is padding.
      output += ALPHABET.charAt(group >> 18 & 63) +
        ALPHABET.charAt(group >> 12 & 63) +
        (available > 1 ? ALPHABET.charAt(group >> 6 & 63) : PAD) +
        (available > 2 ? ALPHABET.charAt(group & 63) : PAD);
    }

    return output;
  };

  /**
   * Decodes a base64 string into a binary string.
   *
   * ASCII whitespace (tab, LF, FF, CR, space) is ignored anywhere in the
   * input and trailing "=" padding is optional.
   *
   * @param {*} input - Value to decode; it is converted with `String(input)`.
   * @returns {string} Binary string with one character (0x00-0xFF) per byte.
   * @throws {InvalidCharacterError} If, after removing whitespace and trailing
   *   padding, the length is 1 modulo 4 or any character is outside the
   *   base64 alphabet (including "=" anywhere but the end).
   */
  root.atob = function (input) {
    var str = String(input)
      // Drop whitespace first so it neither hides trailing padding nor skews
      // the length check below.
      .replace(/[\t\n\f\r ]+/g, '')
      // "[=]" instead of a bare "=": the original source notes (#31) that
      // ExtendScript misparses "/=".
      .replace(/[=]+$/, '');

    // A single leftover character carries only 6 bits, which cannot form a byte.
    if (str.length % 4 === 1) {
      throw new InvalidCharacterError("'atob' failed: The string to be decoded is not correctly encoded.");
    }

    var output = '';
    var pending = 0;      // bits read but not yet emitted as a byte
    var pendingBits = 0;  // how many low bits of `pending` are meaningful

    for (var idx = 0; idx < str.length; idx++) {
      var value = ALPHABET.indexOf(str.charAt(idx));
      if (value === -1) {
        // Reject instead of skipping: silently dropping characters (or
        // decoding a misplaced "=") would return corrupted data.
        throw new InvalidCharacterError("'atob' failed: The string to be decoded is not correctly encoded.");
      }

      pending = pending << 6 | value;
      pendingBits += 6;

      if (pendingBits >= 8) {
        pendingBits -= 8;
        output += String.fromCharCode(pending >> pendingBits & 0xFF);
        // Keep only the bits that have not been emitted yet.
        pending &= (1 << pendingBits) - 1;
      }
    }

    // Any leftover bits (fewer than 8) are discarded.
    return output;
  };

  // Prefer `globalThis`; fall back to the script-level `this` on engines that
  // predate it.
}(typeof globalThis !== 'undefined' ? globalThis : this));

然后我写了一个使用它的虚函数:

# Copy the local btoa_atob.js file into the Cloud Storage bucket "my-bucket".
gsutil cp btoa_atob.js gs://my-bucket/