Skip to main content

tfrecords: simplify and transplant the tfrecords

Project description

tfrecords

Simplified, portable support for the tfrecord format and key-value tables

update information

    2022-10-30:  Added lmdb and leveldb readers and writers, and batch writing for records
    2022-10-17:  Added a shared-memory mode for record reading, enabling faster reads.
    2022-02-01:  simplify and transplant the tfrecord dataset

1. Record read and write demo; the with_share_memory flag enables accelerated reading

# -*- coding: utf-8 -*-
# @Time    : 2022/9/8 15:49

import tfrecords
# Shared reader/writer options used by every demo below: no compression.
options = tfrecords.TFRecordOptions(compression_type=tfrecords.TFRecordCompressionType.NONE)
def test_write(filename, N=3, context='aaa', batch_size=100):
    """Write N string records to *filename*, flushing in batches.

    Args:
        filename: path of the tfrecord file to create.
        N: number of records to write.
        context: payload prefix; each record is "<context>____<i>".
        batch_size: number of records buffered before each write_batch call
            (generalized from the previously hard-coded 100).
    """
    with tfrecords.TFRecordWriter(filename, options=options) as file_writer:
        batch_data = []
        for i in range(N):
            batch_data.append(context + '____' + str(i))
            # Flush a full batch to keep memory bounded for large N.
            if (i + 1) % batch_size == 0:
                file_writer.write_batch(batch_data)
                batch_data.clear()
        # Flush any trailing partial batch.
        if batch_data:
            file_writer.write_batch(batch_data)
            batch_data.clear()

def test_record_iterator(example_paths):
    """Print every record in each tfrecord file.

    Also demonstrates the iterator's read_offsets / read_count helpers.
    """
    print('test_record_iterator')
    for example_path in example_paths:
        iterator = tfrecords.tf_record_iterator(example_path, options=options, skip_bytes=0, with_share_memory=True)
        # (offset, length) pairs for each record; shown here for API demonstration.
        offset_list = iterator.read_offsets(0)
        count = iterator.read_count(0)
        print(count)
        num = 0
        # Loop variable renamed from `iter`, which shadowed the builtin.
        for record in iterator:
            num += 1
            print(record)

def test_random_reader(example_paths):
    """Read records sequentially via the random reader.

    Each read returns (record, next_position); the loop advances by that
    position until the reader raises, which signals end-of-file here.
    """
    print('test_random_reader')
    for example_path in example_paths:
        file_reader = tfrecords.tf_record_random_reader(example_path, options=options, with_share_memory=True)
        last_pos = 0
        while True:
            try:
                x, pos = file_reader.read(last_pos)
            except Exception:  # raised past the last record -- treated as EOF (TODO: confirm exact exception type)
                break
            print(x, pos)
            last_pos = pos

def test_random_reader2(example_paths):
    """Read every record by byte offset, using the reader's offset table."""
    print('test_random_reader2')
    for path in example_paths:
        reader = tfrecords.tf_record_random_reader(path, options=options, with_share_memory=True)
        # read_offsets(0) yields (offset, length) for each record from the start.
        for record_offset, _record_length in reader.read_offsets(0):
            record, _ = reader.read(record_offset)
            print(record)

# Driver: write one sample file, then exercise each reader on all matching files.
test_write('d:/example.tfrecords0', 3, 'file0')

example_paths = tfrecords.glob('d:/example.tfrecords*')
print(example_paths)
for demo in (test_record_iterator, test_random_reader, test_random_reader2):
    demo(example_paths)
    print()

2. Leveldb read and write demo

# -*- coding: utf-8 -*-
# @Time    : 2022/9/8 15:49

from tfrecords import LEVELDB
# Directory of the on-disk leveldb database used by this demo.
db_path = 'd:/example_leveldb'
def test_write(db_path):
    """Write 60 key/value pairs (input_i / label_i) to a leveldb at *db_path*.

    Pairs are buffered and flushed with put_batch; the db handle is closed
    even if a write fails (previously close() was skipped on error).
    """
    options = LEVELDB.LeveldbOptions(create_if_missing=True, error_if_exists=False)
    file_writer = LEVELDB.Leveldb(db_path, options)
    try:
        keys, values = [], []
        for i in range(30):
            keys.append(b"input_" + str(i).encode())
            keys.append(b"label_" + str(i).encode())
            values.append(b"xiaoming" + str(i).encode())
            values.append(b"zzs" + str(i).encode())
            # Flush every 1000 iterations to bound memory (never fires for 30).
            if (i + 1) % 1000 == 0:
                file_writer.put_batch(keys, values)
                keys.clear()
                values.clear()
        # Flush the trailing partial batch.
        if keys:
            file_writer.put_batch(keys, values)
    finally:
        file_writer.close()
def test_read(db_path):
    """Dump all entries of the leveldb at *db_path*, then look up a few keys.

    The handle is closed even if iteration or a lookup raises (previously
    close() was skipped on error).
    """
    options = LEVELDB.LeveldbOptions(create_if_missing=False, error_if_exists=False)
    reader = LEVELDB.Leveldb(db_path, options)
    try:
        def show():
            # Iterate the whole database in forward key order.
            it = reader.get_iterater(reverse=False)
            for i, item in enumerate(it):
                print(i, item)

        def test_find(key):
            value = reader.get(key)
            print('find', type(value), value)

        show()

        test_find(b'input_0')
        test_find(b'input_5')
        test_find(b'input_10')
    finally:
        reader.close()

# Run the leveldb demo: populate the database, then read it back.
test_write(db_path)
test_read(db_path)

3. lmdb read and write demo

# -*- coding: utf-8 -*-
# @Time    : 2022/9/8 15:49

from tfrecords import LMDB
# Directory of the on-disk lmdb environment used by this demo.
db_path = 'd:/example_lmdb'
def test_write(db_path):
    """Write 60 key/value pairs (input_i / label_i) to an lmdb at *db_path*.

    Pairs are buffered and flushed with put_batch; the env handle is closed
    even if a write fails (previously close() was skipped on error).
    """
    options = LMDB.LmdbOptions(env_open_flag=0,
                env_open_mode=0o664,  # octal unix permission bits for the env files
                txn_flag=0,
                dbi_flag=0,
                put_flag=0)
    file_writer = LMDB.Lmdb(db_path, options, map_size=1024 * 1024 * 10)
    try:
        keys, values = [], []
        for i in range(30):
            keys.append(b"input_" + str(i).encode())
            keys.append(b"label_" + str(i).encode())
            values.append(b"xiaoming_" + str(i).encode())
            values.append(b"zzs_" + str(i).encode())
            # Flush every 1000 iterations to bound memory (never fires for 30).
            if (i + 1) % 1000 == 0:
                file_writer.put_batch(keys, values)
                keys.clear()
                values.clear()
        # Flush the trailing partial batch.
        if keys:
            file_writer.put_batch(keys, values)
    finally:
        file_writer.close()
def test_read(db_path):
    """Dump all entries of the lmdb at *db_path*, then look up a few keys.

    Opens the environment read-only; the handle is closed even if a read
    raises (previously close() was skipped on error).
    """
    options = LMDB.LmdbOptions(env_open_flag=LMDB.LmdbFlag.MDB_RDONLY,
                env_open_mode=0o664,  # octal unix permission bits for the env files
                txn_flag=0,
                dbi_flag=0,
                put_flag=0)
    reader = LMDB.Lmdb(db_path, options, map_size=0)
    try:
        def show():
            # Iterate the whole database in forward key order.
            it = reader.get_iterater(reverse=False)
            for i, item in enumerate(it):
                print(i, item)

        def test_find(key):
            value = reader.get(key)
            print('find', type(value), value)

        show()
        # BUG FIX: test_write stores bytes keys like b'input_0'; the previous
        # lookups ('input0', 'input5', b'input10') lacked the underscore and
        # used str keys, so they could never match what was written.
        test_find(b'input_0')
        test_find(b'input_5')
        test_find(b'input_10')
    finally:
        reader.close()

# Run the lmdb demo: populate the database, then read it back.
test_write(db_path)
test_read(db_path)

Project details


Download files

Download the file for your platform. If you're not sure which to choose, learn more about installing packages.

Source Distributions

No source distribution files available for this release. See the tutorial on generating distribution archives.

Built Distributions

tfrecords-0.2.4-cp310-cp310-win_amd64.whl (1.1 MB view hashes)

Uploaded CPython 3.10 Windows x86-64

tfrecords-0.2.4-cp310-cp310-manylinux2014_x86_64.whl (2.5 MB view hashes)

Uploaded CPython 3.10

tfrecords-0.2.4-cp310-cp310-manylinux2014_aarch64.whl (2.4 MB view hashes)

Uploaded CPython 3.10

tfrecords-0.2.4-cp39-cp39-win_amd64.whl (1.1 MB view hashes)

Uploaded CPython 3.9 Windows x86-64

tfrecords-0.2.4-cp39-cp39-manylinux2014_x86_64.whl (2.5 MB view hashes)

Uploaded CPython 3.9

tfrecords-0.2.4-cp39-cp39-manylinux2014_aarch64.whl (2.4 MB view hashes)

Uploaded CPython 3.9

tfrecords-0.2.4-cp38-cp38-win_amd64.whl (1.1 MB view hashes)

Uploaded CPython 3.8 Windows x86-64

tfrecords-0.2.4-cp38-cp38-manylinux2014_x86_64.whl (2.5 MB view hashes)

Uploaded CPython 3.8

tfrecords-0.2.4-cp38-cp38-manylinux2014_aarch64.whl (2.4 MB view hashes)

Uploaded CPython 3.8

tfrecords-0.2.4-cp37-cp37m-win_amd64.whl (1.1 MB view hashes)

Uploaded CPython 3.7m Windows x86-64

tfrecords-0.2.4-cp37-cp37m-manylinux2014_x86_64.whl (2.5 MB view hashes)

Uploaded CPython 3.7m

tfrecords-0.2.4-cp37-cp37m-manylinux2014_aarch64.whl (2.4 MB view hashes)

Uploaded CPython 3.7m

tfrecords-0.2.4-cp36-cp36m-win_amd64.whl (1.1 MB view hashes)

Uploaded CPython 3.6m Windows x86-64

tfrecords-0.2.4-cp36-cp36m-manylinux2014_x86_64.whl (2.5 MB view hashes)

Uploaded CPython 3.6m

tfrecords-0.2.4-cp36-cp36m-manylinux2014_aarch64.whl (2.4 MB view hashes)

Uploaded CPython 3.6m

Supported by

AWS AWS Cloud computing and Security Sponsor Datadog Datadog Monitoring Fastly Fastly CDN Google Google Download Analytics Microsoft Microsoft PSF Sponsor Pingdom Pingdom Monitoring Sentry Sentry Error logging StatusPage StatusPage Status page