Mar 23, 2009
by
pauln
Both this and the one below appear to be caused by the reentrancy problem that was fixed in Zest about two weeks ago.
[root@castor mount_slash]# fg
PSC_LOG_LEVEL=2 SLASH_MDS_NID="128.182.58.80@tcp10" LNET_NETWORKS="tcp10(eth1)" USOCK_CPORT=1300 gdb ./mount_slash
#0 0x0000000000404e0c in atomic_dec (v=0x28)
at ..//..//psc_fsutil_libs/include/psc_util/atomic.h:393
#1 0x000000000040531a in slash2fuse_access (req=0x7fafb0, ino=15294024,
mask=1) at main.c:229
#2 0x0000000000403ee2 in slash2fuse_listener_loop (arg=0x0)
at fuse_listener.c:260
#3 0x0000003e8ce073da in start_thread () from /lib64/libpthread.so.0
#4 0x0000003e8c2e62bd in clone () from /lib64/libc.so.6
(gdb) up
#1 0x000000000040531a in slash2fuse_access (req=0x7fafb0, ino=15294024,
mask=1) at main.c:229
229 fidc_membh_dropref(c);
(gdb) print *c
Cannot access memory at address 0x0
(gdb)
Mar 20, 2009
by
pauln
Here are some changes I had to make for building on Fedora Core 10.
Note that a symlink was made in /usr/src/kernels.
(psc@castor:projects)$ ls -al /usr/src/kernels/slash2-devel-kernel
lrwxrwxrwx 1 root root 30 Mar 20 13:04 /usr/src/kernels/slash2-devel-kernel -> 2.6.27.19-170.2.35.fc10.x86_64/
Index: psc_fsutil_libs/include/psc_util/atomic.h
===================================================================
--- psc_fsutil_libs/include/psc_util/atomic.h (revision 5643)
+++ psc_fsutil_libs/include/psc_util/atomic.h (working copy)
@@ -3,9 +3,12 @@
#ifndef _PFL_ATOMIC_H_
#define _PFL_ATOMIC_H_
+#include "psc_types.h"
#include <sys/types.h>
-#include <asm/bitops.h>
-#include <asm/system.h>
+#include <asm/types.h>
+//#include <linux/bitops.h>
+//#include <asm/system.h>
+#include <asm/cmpxchg.h>
#include
Mar 5, 2009
by
pauln
wolverine (128.182.58.80) is configured as a SLASH2 metadata server.
Below is a dump of the ZFS configuration:
(pauln@wolverine:zpool)$ sudo ./zpool status
pool: wolverine_pool
state: ONLINE
scrub: none requested
config:
NAME STATE READ WRITE CKSUM
wolverine_pool ONLINE 0 0 0
raidz1 ONLINE 0 0 0
sdb1 ONLINE 0 0 0
sdc1 ONLINE 0 0 0
sdd1 ONLINE 0 0 0
errors: No known data errors
To date I’ve been able to successfully run a 10-million-file create (and unlink) test.
Here’s the fio test config:
group 8peReadWrite {
files_per_dir = 1024;
tree_depth = 8;
tree_width = 3;
pes = 4;
test_freq = 0;
block_freq = 0;
path = /slashfs_client/pauln;
output_path = /tmp;
filename = 8paeRW_1mbs;
file_size = 128m;
block_size = 4m;
thrash_lock = yes;
samedir = yes;
samefile = no;
intersperse = no;
seekoff = no;
fsync_block = no;
verify = yes;
barrier = yes;
time_block = no;
block_barrier = no;
time_barrier = no;
iterations = 1;
debug_conf = no;
debug_block = no;
debug_memory = no;
debug_buffer = no;
debug_output = no;
debug_dtree = no;
debug_barrier = no;
debug_iofunc = no;
iotests (
WriteEmUp [create:openwr:close]
statem [stat]
)
}
Feb 20, 2009
by
pauln
The FUSE handlers for these calls are located in mount_slash/main.c.
Works Fs Call Handler
----- ----------- ------------
Y mount() fuse native.
Y statfs() slash2fuse_statfs()
Y creat() slash2fuse_create()
Y open() slash2fuse_open()
Y stat() slash2fuse_getattr()
Y fstat() slash2fuse_getattr()
Y mkdir() slash2fuse_mkdir()
Y readdir() slash2fuse_readdir_helper()
Y rmdir() slash2fuse_rmdir_helper()
Y unlink() slash2fuse_unlink_helper()
Y close() slash2fuse_release() / slash2fuse_releasedir()
? access() slash2fuse_access()
N read()
N write()
N readlink()
N mknod()
N symlink()
N fsync()
Feb 20, 2009
by
pauln
Every 1.0s: /usr/local/oprof/bin/opreport -l /home/pauln/Code/p... Fri Feb 20 19:02:29 2009
CPU: Core 2, speed 1861.91 MHz (estimated)
Counted CPU_CLK_UNHALTED events (Clock cycles when not halted) with a unit mask of 0x00 (Unhalted core cycles) count 100000
samples % symbol name
281883 8.5757 fidc_child_get
172012 5.2331 psc_log_getlevel
123185 3.7476 _tands
112082 3.4099 _tands
96002 2.9207 __fidc_lookup_fg
67061 2.0402 psc_realloc
61288 1.8646 pscthr_get_canfail
52057 1.5837 .plt
50217 1.5277 libcfs_nid2str2
48670 1.4807 pscrpc_queue_wait
48245 1.4678 slash2fuse_listener_loop
46889 1.4265 slash2fuse_lookup_helper
40108 1.2202 reqlock
37342 1.1361 lnet_lookup_cookie
36247 1.1027 _tands
31848 0.9689 list_add
30684 0.9335 pscrpc_check_reply
30113 0.9161 psc_send_rpc
29668 0.9026 lnet_match_md
29663 0.9024 atomic_inc
29124 0.8860 _tands
28722 0.8738 fidc_gettime
28017 0.8524 lib_get_event
26676 0.8116 __fidc_lookup_inode
23277 0.7082 lnet_try_match_md
23163 0.7047 __pscrpc_free_req
23156 0.7045 atomic_dec_and_test
23151 0.7043 __list_add
22680 0.6900 usocklnd_read_msg
22562 0.6864 lnet_post_send_locked
22118 0.6729 atomic_dec
22031 0.6702 lnet_finalize
21960 0.6681 atomic_inc
20240 0.6158 lnet_md_unlink
19983 0.6079 ureqlock
19933 0.6064 lnet_find_peer_locked
19773 0.6016 lnet_enq_event_locked
19549 0.5947 _tands
19457 0.5919 lnet_parse
19407 0.5904 ureqlock
19382 0.5897 lnet_initialise_handle
19275 0.5864 spinlock
19076 0.5803 lib_md_build
18869 0.5741 LNetPut
18828 0.5728 lnet_return_credits_locked
18411 0.5601 LNetEQPoll
18290 0.5564 __list_add
17946 0.5460 reply_in_callback
17885 0.5441 atomic_dec
17865 0.5435 LNetMEAttach
17779 0.5409 lnet_commit_md
17153 0.5218 pscrpc_master_callback
17100 0.5202 atomic_add
16660 0.5068 usocklnd_send_tx
16440 0.5002 list_add
16058 0.4885 validlock
15911 0.4841 lnet_nid2ni_locked
15805 0.4808 list_del
15609 0.4749 slash2fuse_stat
15307 0.4657 lnet_match_blocked_msg
15144 0.4607 psc_unpack_msg
15024 0.4571 list_del
14957 0.4550 lnet_complete_msg_locked
14392 0.4378 pscrpc_prep_req_pool
13803 0.4199 __list_add
13660 0.4156 libcfs_lnd2netstrfns
12730 0.3873 after_reply
12571 0.3824 __list_add
12385 0.3768 list_empty
12356 0.3759 lnet_send
12109 0.3684 fcmh_clean_check
11929 0.3629 validlock
11847 0.3604 list_del
11730 0.3569 lnet_ni_addref_locked
11679 0.3553 usocklnd_find_peer_locked
11524 0.3506 usocklnd_create_tx
11473 0.3490 _tands