/usr/include/htslib/bgzf.h is in libhts-dev 1.7-2.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
/// @file htslib/bgzf.h
/// Low-level routines for direct BGZF operations.
/*
Copyright (c) 2008 Broad Institute / Massachusetts Institute of Technology
2011, 2012 Attractive Chaos <attractor@live.co.uk>
Copyright (C) 2009, 2013, 2014,2017 Genome Research Ltd
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
/* The BGZF library was originally written by Bob Handsaker from the Broad
* Institute. It was later improved by the SAMtools developers. */
#ifndef HTSLIB_BGZF_H
#define HTSLIB_BGZF_H
#include <stdint.h>
#include <stdio.h>
#include <zlib.h>
#include <sys/types.h>
#include "hts_defs.h"
#ifdef __cplusplus
extern "C" {
#endif
/* Block sizing.  BGZF_BLOCK_SIZE (0xff00 = 65280) is deliberately smaller
 * than BGZF_MAX_BLOCK_SIZE (0x10000 = 65536); see the constraint noted on
 * the first definition. */
#define BGZF_BLOCK_SIZE 0xff00 // make sure compressBound(BGZF_BLOCK_SIZE) < BGZF_MAX_BLOCK_SIZE
#define BGZF_MAX_BLOCK_SIZE 0x10000
/* Error flags.  Each value is a distinct power of two, so several flags can
 * be combined in a single bit mask.
 * NOTE(review): presumably these are OR-ed into the errcode bit-field of
 * struct BGZF -- confirm against the implementation. */
#define BGZF_ERR_ZLIB 1
#define BGZF_ERR_HEADER 2
#define BGZF_ERR_IO 4
#define BGZF_ERR_MISUSE 8
#define BGZF_ERR_MT 16 // stream cannot be multi-threaded
#define BGZF_ERR_CRC 32
/* Incomplete types.  This header only ever uses pointers to them, so forward
 * declarations are sufficient and their definitions are not needed here. */
struct hFILE;
struct hts_tpool;
struct bgzf_mtaux_t;
typedef struct __bgzidx_t bgzidx_t;
typedef struct bgzf_cache_t bgzf_cache_t;
/**
 * State of one open BGZF stream.
 *
 * The layout is visible to callers: the bgzf_tell() macro in this header
 * reads block_address and block_offset directly from this structure.
 */
struct BGZF {
// Reserved bits should be written as 0; read as "don't care"
// errcode is 16 bits wide.
// NOTE(review): presumably a mask of BGZF_ERR_* flags -- confirm.
unsigned errcode:16, reserved:1, is_write:1, no_eof_block:1, is_be:1;
// Signed 9-bit field, so negative levels are representable.
signed compress_level:9;
unsigned last_block_eof:1, is_compressed:1, is_gzip:1;
// NOTE(review): presumably the limit configured by bgzf_set_cache_size() -- confirm.
int cache_size;
// block_offset supplies the low 16 bits of the bgzf_tell() value.
int block_length, block_clength, block_offset;
// block_address supplies the bits above the low 16 of the bgzf_tell() value.
int64_t block_address, uncompressed_address;
void *uncompressed_block, *compressed_block;
bgzf_cache_t *cache;
struct hFILE *fp; // actual file handle
struct bgzf_mtaux_t *mt; // only used for multi-threading
bgzidx_t *idx; // BGZF index
int idx_build_otf; // build index on the fly, set by bgzf_index_build_init()
z_stream *gz_stream;// for gzip-compressed files
};
/* Emit the BGZF typedef at most once: HTS_BGZF_TYPEDEF is defined right
 * after the typedef, and the typedef is skipped if it is already defined. */
#ifndef HTS_BGZF_TYPEDEF
typedef struct BGZF BGZF;
#define HTS_BGZF_TYPEDEF
#endif
/* String-buffer type taken by bgzf_getline().  The definition is skipped
 * when KSTRING_T is already defined, so it can coexist with another header
 * that provides the same guarded definition.
 * NOTE(review): the field meanings are not stated here -- presumably l is
 * the current length, m the allocated capacity and s the buffer; confirm
 * against the kstring header. */
#ifndef KSTRING_T
#define KSTRING_T kstring_t
typedef struct __kstring_t {
size_t l, m;
char *s;
} kstring_t;
#endif
/******************
* Basic routines *
******************/
/**
 * Open an existing file descriptor for reading or writing.
 *
 * @param fd    file descriptor.
 *              Note that the file must be opened in binary mode, or else
 *              there will be problems on platforms that make a difference
 *              between text and binary mode.
 * @param mode  mode matching /[rwag][u0-9]+/: 'r' for reading, 'w' for
 *              writing, 'a' for appending, 'g' for gzip rather than BGZF
 *              compression (with 'w' only), and a digit specifies the zlib
 *              compression level.
 *              Note that there is a distinction between 'u' and '0': the
 *              first yields plain uncompressed output whereas the latter
 *              outputs uncompressed data wrapped in the zlib format.
 * @return      BGZF file handler; 0 (a null pointer) on error
 */
BGZF* bgzf_dopen(int fd, const char *mode);
/* Older spelling of bgzf_dopen(); expands to a direct call with the same
 * two arguments. */
#define bgzf_fdopen(fd, mode) bgzf_dopen((fd), (mode)) // for backward compatibility
/**
 * Open the specified file for reading or writing.
 *
 * @param path  path of the file to open
 * @param mode  NOTE(review): not documented here -- presumably the same
 *              mode string accepted by bgzf_dopen(); confirm
 * @return      NOTE(review): not documented here -- presumably a BGZF file
 *              handler, or 0 on error, as for bgzf_dopen(); confirm
 */
BGZF* bgzf_open(const char* path, const char *mode);
/**
 * Open an existing hFILE stream for reading or writing.
 *
 * @param fp    hFILE stream to wrap
 * @param mode  NOTE(review): not documented here -- presumably the same
 *              mode string accepted by bgzf_dopen(); confirm
 * @return      NOTE(review): not documented here -- presumably a BGZF file
 *              handler, or 0 on error, as for bgzf_dopen(); confirm
 */
BGZF* bgzf_hopen(struct hFILE *fp, const char *mode);
/**
 * Close the BGZF and free all associated resources.
 *
 * The handle must not be used again after this call, since its resources
 * have been released.
 *
 * @param fp    BGZF file handler
 * @return      0 on success and -1 on error
 */
int bgzf_close(BGZF *fp);
/**
 * Read up to _length_ bytes from the file, storing them into _data_.
 *
 * Fewer than _length_ bytes may be returned; callers must use the return
 * value rather than assume the buffer was filled.
 *
 * @param fp     BGZF file handler
 * @param data   data array to read into
 * @param length size of data to read
 * @return       number of bytes actually read; 0 on end-of-file and -1 on error
 */
ssize_t bgzf_read(BGZF *fp, void *data, size_t length) HTS_RESULT_USED;
/**
 * Write _length_ bytes from _data_ to the file.  If no I/O errors occur,
 * the complete _length_ bytes will be written (or queued for writing).
 *
 * Because data may only be queued, a successful return does not by itself
 * mean the bytes have reached the underlying file.
 *
 * @param fp     BGZF file handler
 * @param data   data array to write
 * @param length size of data to write
 * @return       number of bytes written (i.e., _length_); negative on error
 */
ssize_t bgzf_write(BGZF *fp, const void *data, size_t length) HTS_RESULT_USED;
/**
 * Write _length_ bytes from _data_ to the file; the index will be used to
 * decide the amount of uncompressed data to be written to each bgzip block.
 * If no I/O errors occur, the complete _length_ bytes will be written (or
 * queued for writing).
 *
 * Unlike bgzf_write(), this declaration is not marked HTS_RESULT_USED;
 * callers should still check the result, as it is negative on error.
 *
 * @param fp     BGZF file handler
 * @param data   data array to write
 * @param length size of data to write
 * @return       number of bytes written (i.e., _length_); negative on error
 */
ssize_t bgzf_block_write(BGZF *fp, const void *data, size_t length);
/**
 * Read up to _length_ bytes directly from the underlying stream without
 * decompressing.  This bypasses BGZF blocking, so it must be used with care
 * and in specialised circumstances only.
 *
 * @param fp     BGZF file handler
 * @param data   data array to read into
 * @param length number of raw bytes to read
 * @return       number of bytes actually read; 0 on end-of-file and -1 on error
 */
ssize_t bgzf_raw_read(BGZF *fp, void *data, size_t length) HTS_RESULT_USED;
/**
 * Write _length_ bytes directly to the underlying stream without
 * compressing.  This bypasses BGZF blocking, so it must be used with care
 * and in specialised circumstances only.
 *
 * @param fp     BGZF file handler
 * @param data   data array to write
 * @param length number of raw bytes to write
 * @return       number of bytes actually written; -1 on error
 */
ssize_t bgzf_raw_write(BGZF *fp, const void *data, size_t length) HTS_RESULT_USED;
/**
 * Write the data currently held in the buffer to the file.
 *
 * @param fp    BGZF file handle
 * @return      0 on success and -1 on error
 */
int bgzf_flush(BGZF *fp) HTS_RESULT_USED;
/**
 * Return a virtual file pointer to the current location in the file.
 * No interpretation of the value should be made, other than that a
 * subsequent call to bgzf_seek() can be used to position the file at the
 * same point.  The return value is non-negative on success.
 *
 * Implementation note: the value is fp->block_address shifted left by 16
 * bits, OR-ed with the low 16 bits of fp->block_offset.
 *
 * This is a macro and its argument appears twice in the expansion, so do
 * not pass an expression with side effects (e.g. bgzf_tell(files[i++])).
 */
#define bgzf_tell(fp) (((fp)->block_address << 16) | ((fp)->block_offset & 0xFFFF))
/**
 * Set the file to read from the location specified by _pos_.
 *
 * Although the return type is int64_t, the documented results are only the
 * status values 0 and -1; the new position is not returned.
 *
 * @param fp     BGZF file handler
 * @param pos    virtual file offset returned by bgzf_tell()
 * @param whence must be SEEK_SET
 * @return       0 on success and -1 on error
 */
int64_t bgzf_seek(BGZF *fp, int64_t pos, int whence) HTS_RESULT_USED;
/**
 * Check whether the BGZF end-of-file (EOF) marker is present.
 *
 * Note that both 1 and 2 are non-error results, so the return value should
 * be compared against the specific codes rather than tested for truth.
 *
 * @param fp    BGZF file handler opened for reading
 * @return      1 if the EOF marker is present and correct;
 *              2 if it can't be checked, e.g., because fp isn't seekable;
 *              0 if the EOF marker is absent;
 *              -1 (with errno set) on error
 */
int bgzf_check_EOF(BGZF *fp);
/**
 * Return the file's compression format.
 *
 * @param fp    BGZF file handle
 * @return      A small integer matching the corresponding
 *              `enum htsCompression` value:
 *                - 0 / `no_compression` if the file is uncompressed
 *                - 1 / `gzip` if the file is plain GZIP-compressed
 *                - 2 / `bgzf` if the file is BGZF-compressed
 * @since 1.4
 */
int bgzf_compression(BGZF *fp);
/**
 * Check if a file is in the BGZF format.
 *
 * The result cannot distinguish "not BGZF" from an I/O error, since both
 * are reported as 0.
 *
 * @param fn    file name
 * @return      1 if _fn_ is BGZF; 0 if not or on I/O error
 * @deprecated  Use bgzf_compression() or hts_detect_format() instead.
 */
int bgzf_is_bgzf(const char *fn) HTS_DEPRECATED("Use bgzf_compression() or hts_detect_format() instead");
/*********************
* Advanced routines *
*********************/
/**
 * Set the cache size.  Only effective when compiled with -DBGZF_CACHE.
 *
 * The function returns nothing, so a caller cannot tell from the call
 * whether caching was actually enabled.
 *
 * @param fp    BGZF file handler
 * @param size  size of cache in bytes; 0 to disable caching (default)
 */
void bgzf_set_cache_size(BGZF *fp, int size);
/**
 * Flush the file if the remaining buffer size is smaller than _size_.
 *
 * @param fp    BGZF file handler
 * @param size  threshold that the remaining buffer size is compared against
 * @return      0 if flushing succeeded or was not needed; negative on error
 */
int bgzf_flush_try(BGZF *fp, ssize_t size) HTS_RESULT_USED;
/**
 * Read one byte from a BGZF file.  It is faster than bgzf_read().
 *
 * End-of-file and error are both reported as -1, so they cannot be told
 * apart from the return value alone.
 *
 * @param fp    BGZF file handler
 * @return      byte read; -1 on end-of-file or error
 */
int bgzf_getc(BGZF *fp);
/**
 * Read one line from a BGZF file.  It is faster than calling bgzf_getc()
 * repeatedly.
 *
 * @param fp    BGZF file handler
 * @param delim delimiter
 * @param str   string to write to; must be initialized
 * @return      length of the string; -1 on end-of-file; <= -2 on error
 */
int bgzf_getline(BGZF *fp, int delim, kstring_t *str);
/**
 * Read the next BGZF block.
 *
 * @param fp    BGZF file handler
 * @return      NOTE(review): not documented here -- presumably 0 on success
 *              and negative on error, like the other int-returning routines
 *              in this header; confirm against the implementation
 */
int bgzf_read_block(BGZF *fp) HTS_RESULT_USED;
/**
 * Enable multi-threading (when compiled with -DBGZF_MT) via a shared
 * thread pool.  This means both encoder and decoder can balance
 * usage across a single pool of worker jobs.
 *
 * @param fp    BGZF file handler; must be opened for writing
 * @param pool  The thread pool (see hts_create_threads)
 * @param qsize NOTE(review): not documented here -- presumably a queue size
 *              associated with the pool; confirm against the implementation
 * @return      NOTE(review): not documented here -- presumably 0 on success
 *              and negative on error; confirm
 */
int bgzf_thread_pool(BGZF *fp, struct hts_tpool *pool, int qsize);
/**
 * Enable multi-threading (only effective when the library was compiled
 * with -DBGZF_MT).
 *
 * @param fp         BGZF file handler; must be opened for writing
 * @param n_threads  #threads used for writing
 * @param n_sub_blks #blocks processed by each thread; a value 64-256 is
 *                   recommended
 * @return           NOTE(review): not documented here -- presumably 0 on
 *                   success and negative on error; confirm
 */
int bgzf_mt(BGZF *fp, int n_threads, int n_sub_blks);
/**
 * Compress a single BGZF block.
 *
 * _dlen_ is an in/out parameter: set it to the capacity of _dst_ before the
 * call and read the number of bytes produced from it afterwards.
 *
 * @param dst    output buffer (must have size >= BGZF_MAX_BLOCK_SIZE)
 * @param dlen   size of output buffer; updated on return to the number
 *               of bytes actually written to dst
 * @param src    buffer to be compressed
 * @param slen   size of data to compress (must be <= BGZF_BLOCK_SIZE)
 * @param level  compression level
 * @return       0 on success and negative on error
 */
int bgzf_compress(void *dst, size_t *dlen, const void *src, size_t slen, int level);
/*******************
* bgzidx routines *
*******************/
/**
 * Position BGZF at the given uncompressed offset.
 *
 * The offset is passed as a long, so the range of offsets that can be
 * expressed depends on the width of long on the target platform.
 *
 * @param fp      BGZF file handler; must be opened for reading
 * @param uoffset file offset in the uncompressed data
 * @param where   SEEK_SET supported atm
 * @return        0 on success and -1 on error
 */
int bgzf_useek(BGZF *fp, long uoffset, int where) HTS_RESULT_USED;
/**
 * Report the current position in the uncompressed BGZF data.
 *
 * The offset is returned as a long, so the range of offsets that can be
 * reported depends on the width of long on the target platform.
 *
 * @param fp    BGZF file handler; must be opened for reading
 * @return      the current offset on success and -1 on error
 */
long bgzf_utell(BGZF *fp);
/**
 * Tell BGZF to build index while compressing.
 *
 * The idx_build_otf member of struct BGZF is documented as being set by
 * this function.
 *
 * @param fp    BGZF file handler; can be opened for reading or writing
 * @return      0 on success and -1 on error
 */
int bgzf_index_build_init(BGZF *fp);
/// Load BGZF index
/**
 * The index is located from _bname_ with _suffix_ added to it when a suffix
 * is given.
 *
 * @param fp     BGZF file handler
 * @param bname  base name
 * @param suffix suffix to add to bname (can be NULL)
 * @return       0 on success and -1 on error.
 */
int bgzf_index_load(BGZF *fp,
const char *bname, const char *suffix) HTS_RESULT_USED;
/// Load BGZF index from an hFILE
/**
 * @param fp    BGZF file handle
 * @param idx   hFILE to read from
 * @param name  file name (for error reporting only; can be NULL)
 * @return      0 on success and -1 on error.
 *
 * Populates @p fp with index data read from the hFILE handle @p idx.
 * The file pointer of @p idx should point to the start of the index
 * data when this function is called.
 *
 * The file name can optionally be passed in the @p name parameter.  This
 * is only used for printing error messages; if NULL the word "index" is
 * used instead.
 */
int bgzf_index_load_hfile(BGZF *fp, struct hFILE *idx,
const char *name) HTS_RESULT_USED;
/// Save BGZF index
/**
 * The output is named from _bname_ with _suffix_ added to it when a suffix
 * is given.
 *
 * @param fp     BGZF file handler
 * @param bname  base name
 * @param suffix suffix to add to bname (can be NULL)
 * @return       0 on success and -1 on error.
 */
int bgzf_index_dump(BGZF *fp,
const char *bname, const char *suffix) HTS_RESULT_USED;
/// Write a BGZF index to an hFILE
/**
 * @param fp    BGZF file handle
 * @param idx   hFILE to write to
 * @param name  file name (for error reporting only, can be NULL)
 * @return      0 on success and -1 on error.
 *
 * Writes index data from @p fp to the hFILE handle @p idx.
 *
 * The file name can optionally be passed in the @p name parameter.  This
 * is only used for printing error messages; if NULL the word "index" is
 * used instead.
 */
int bgzf_index_dump_hfile(BGZF *fp, struct hFILE *idx,
const char *name) HTS_RESULT_USED;
#ifdef __cplusplus
}
#endif
#endif
|