-
Notifications
You must be signed in to change notification settings - Fork 225
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
* change default cache behavior in search_disk_index; scale factors in float to int8 * added int8_to_float_scale file
- Loading branch information
1 parent
3e7d511
commit 10c1b3a
Showing
4 changed files
with
75 additions
and
4 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,62 @@ | ||
// Copyright (c) Microsoft Corporation. All rights reserved. | ||
// Licensed under the MIT license. | ||
|
||
#include <iostream> | ||
#include "utils.h" | ||
|
||
void block_convert(std::ofstream& writer, float* write_buf, | ||
std::ifstream& reader, int8_t* read_buf, _u64 npts, | ||
_u64 ndims, float bias, float scale) { | ||
reader.read((char*) read_buf, npts * ndims * sizeof(int8_t)); | ||
|
||
for (_u64 i = 0; i < npts; i++) { | ||
for (_u64 d = 0; d < ndims; d++) { | ||
write_buf[d + i * ndims] = | ||
(((float)read_buf[d + i * ndims] - bias) * scale); | ||
} | ||
} | ||
writer.write((char*) write_buf, npts * ndims * sizeof(float)); | ||
} | ||
|
||
int main(int argc, char** argv) { | ||
if (argc != 5) { | ||
std::cout << "Usage: " << argv[0] << " input-int8.bin output-float.bin bias scale" | ||
<< std::endl; | ||
exit(-1); | ||
} | ||
|
||
std::ifstream reader(argv[1], std::ios::binary); | ||
_u32 npts_u32; | ||
_u32 ndims_u32; | ||
reader.read((char*) &npts_u32, sizeof(_s32)); | ||
reader.read((char*) &ndims_u32, sizeof(_s32)); | ||
size_t npts = npts_u32; | ||
size_t ndims = ndims_u32; | ||
std::cout << "Dataset: #pts = " << npts << ", # dims = " << ndims | ||
<< std::endl; | ||
|
||
_u64 blk_size = 131072; | ||
_u64 nblks = ROUND_UP(npts, blk_size) / blk_size; | ||
|
||
std::ofstream writer(argv[2], std::ios::binary); | ||
auto read_buf = new int8_t[blk_size * ndims]; | ||
auto write_buf = new float[blk_size * ndims]; | ||
float bias = atof(argv[3]); | ||
float scale = atof(argv[4]); | ||
|
||
writer.write((char*) (&npts_u32), sizeof(_u32)); | ||
writer.write((char*) (&ndims_u32), sizeof(_u32)); | ||
|
||
for (_u64 i = 0; i < nblks; i++) { | ||
_u64 cblk_size = std::min(npts - i * blk_size, blk_size); | ||
block_convert(writer, write_buf, reader, read_buf, cblk_size, ndims, bias, | ||
scale); | ||
std::cout << "Block #" << i << " written" << std::endl; | ||
} | ||
|
||
delete[] read_buf; | ||
delete[] write_buf; | ||
|
||
writer.close(); | ||
reader.close(); | ||
} |